增加代码规范，删除一些无用的function

2025-06-03 21:55:06 +08:00 · 2022-12-15 05:03:26 +00:00 · 2022-12-15 05:03:26 +00:00 · f83ff59c97
commit f83ff59c97
parent 692b8d8c1f
10 changed files with 10 additions and 309 deletions
--- a/docs/zh_CN/training/semi_supervised_learning/FixMatchCCSSL.md
+++ b/docs/zh_CN/training/semi_supervised_learning/FixMatchCCSSL.md
@ -79,14 +79,14 @@ python tools/train.py -c ppcls/configs/ssl/FixMatchCCSSL/FixMatchCCSSL_cifar10_4
 python -m paddle.distributed.launch --gpus='0,1,2,3' tools/train.py -c ppcls/configs/ssl/FixMatchCCSSL/FixMatchCCSSL_cifar10_4000_4gpu.yaml
 ```

-2. **查看训练日志和保存的模型参数文件** 训练过程中屏幕会实时打印loss等指标信息，同时会保存日志文件 `train.log` ，模型参数文件 `*.pdparams`，优化器参数文件 `*.pdopt` 等内容到`Global.output_dir`指定的文件夹下，默认在 `PaddleClas/output/WideResNet/`文件夹下。
+2. **查看训练日志和保存的模型参数文件** 训练过程中屏幕会实时打印loss等指标信息，同时会保存日志文件 `train.log` ，模型参数文件 `*.pdparams`，优化器参数文件 `*.pdopt` 等内容到`Global.output_dir`指定的文件夹下，默认在 `PaddleClas/output/RecModel/`文件夹下。

 ## 5. 模型评估与推理部署
 ### 5.1 模型评估
 准备用于评估的 `*.pdparams` 模型参数文件，可以使用训练好的模型，也可以使用 *4. 模型训练* 中保存的模型。
 * 以训练过程中保存的 `best_model_ema.ema.pdparams`为例，执行如下命令即可进行评估。
 ```
-python3.7 tools/eval.py -c ppcls/configs/ssl/FixMatchCCSSL/FixMatchCCSSL_cifar10_4000_4gpu.yaml -o Global.pretrained_model="./output/WideResNet/best_model_ema.ema"
+python3.7 tools/eval.py -c ppcls/configs/ssl/FixMatchCCSSL/FixMatchCCSSL_cifar10_4000_4gpu.yaml -o Global.pretrained_model="./output/RecModel/best_model_ema.ema"
 ```

 * 以训练好的模型为例，下载提供的已经训练好的模型，到 `PaddleClas/pretrained_models` 文件夹中，执行如下命令即可进行评估。
@ -98,7 +98,7 @@ cd pretrained_models
 wget 
 cd ..
 # 评估
-python3.7 tools/eval.py -c ppcls/configs/ssl/FixMatch_CCSSL_cifar10_4000.yaml -o Global.pretrained_model=""
+python3.7 tools/eval.py -c ppcls/configs/ssl/FixMatchCCSSL/FixMatchCCSSL_cifar10_4000.yaml -o Global.pretrained_model="./output/RecModel/best_model_ema.ema"
 ```
 **注：** `pretrained_model` 后填入的地址不需要加 `.pdparams`后缀，在程序运行时会自动补上。

@ -114,15 +114,15 @@ python3.7 tools/eval.py -c ppcls/configs/ssl/FixMatch_CCSSL_cifar10_4000.yaml -o
 [2022/12/08 09:36:16] ppcls INFO: [Eval][Epoch 0][Iter: 140/157]CELoss: 0.03242, loss: 0.03242, top1: 0.95601, top5: 0.99945, batch_cost: 0.02084s, reader_cost: 0.00075, ips: 3071.00311 images/sec
 [2022/12/08 09:36:16] ppcls INFO: [Eval][Epoch 0][Avg]CELoss: 0.16041, loss: 0.16041, top1: 0.95610, top5: 0.99950
 ```
-默认评估日志保存在 `PaddleClas/output/WideResNetCCSSL/eval.log`中，可以看到我们提供的模型在cifar10数据集上的评估指标为top1: 95.61, top5: 99.95
+默认评估日志保存在 `PaddleClas/output/RecModel/eval.log`中，可以看到我们提供的模型在cifar10数据集上的评估指标为top1: 95.57, top5: 99.95

 ### 5.2 模型推理
 #### 5.2.1 推理模型准备
 将训练过程中保存的模型文件转成inference模型，同样以 `best_model_ema.ema.pdparams`为例，执行以下命令进行转换
 ```
 python3.7 tools/export_model.py \
-c ppcls/configs/ssl/FixMatch_CCSSL/FixMatch_CCSSL_cifar10_4000.yaml \
-o Global.pretrained_model="output/WideResNetCCSSL/best_model_ema.ema" \
+-c ppcls/configs/ssl/FixMatchCCSSL/FixMatchCCSSL_cifar10_4000.yaml \
+-o Global.pretrained_model="output/RecModel/best_model_ema.ema" \
 -o Global.save_inference_dir="./deploy/inference"
 ```

--- a/ppcls/arch/gears/decoup.py
+++ b/ppcls/arch/gears/decoup.py
@ -1,16 +0,0 @@
-import paddle
-import paddle.nn as nn
-
-
-class Decoup(nn.Layer):
-    def __init__(self, logits_index, features_index, **kwargs):
-        super(Decoup, self).__init__()
-        self.logits_index = logits_index
-        self.features_index = features_index
-
-
-    def forward(self, out, **kwargs):
-        assert isinstance(out, (list, tuple)), 'out must  be list or tuple'
-        out = {'logits': out[self.logits_index], 'features':out[self.features_index]}
-        return out
-
--- a/ppcls/configs/ssl/FixMatchCCSSL/FixMatchCCSSL_cifar10_4000_4gpu.yaml
+++ b/ppcls/configs/ssl/FixMatchCCSSL/FixMatchCCSSL_cifar10_4000_4gpu.yaml
@ -64,10 +64,9 @@ Optimizer:
  use_nesterov: true
  weight_decay: 0.001
  lr:
-    name: 'cosine_schedule_with_warmup'
+    name: 'CosineFixmatch'
    learning_rate: 0.03
    num_warmup_steps: 0
-    num_training_steps: 524800

 DataLoader:
  mean: [0.4914, 0.4822, 0.4465]
--- a/ppcls/data/dataloader/__init__.py
+++ b/ppcls/data/dataloader/__init__.py
@ -13,4 +13,3 @@ from ppcls.data.dataloader.person_dataset import Market1501, MSMT17
 from ppcls.data.dataloader.face_dataset import AdaFaceDataset, FiveValidationDataset
 from ppcls.data.dataloader.custom_label_dataset import CustomLabelDataset
 from ppcls.data.dataloader.cifar import Cifar10, Cifar100
-# from ppcls.data.dataloader.cifar import CIFAR10SSL, CIFAR100SSL
--- a/ppcls/data/dataloader/cifar.py
+++ b/ppcls/data/dataloader/cifar.py
@ -15,16 +15,11 @@
 from __future__ import print_function
 import numpy as np
 import cv2
-import shutil
 from ppcls.data import preprocess
 from ppcls.data.preprocess import transform
-# from ppcls.data.preprocess import BaseTransform, ListTransform
 from ppcls.data.dataloader.common_dataset import create_operators
 from paddle.vision.datasets import Cifar10 as Cifar10_paddle
 from paddle.vision.datasets import Cifar100 as Cifar100_paddle
-# from paddle.vision.datasets import cifar
-import os
-# from PIL import Image


 class Cifar10(Cifar10_paddle):
@ -128,176 +123,4 @@ class Cifar100(Cifar100_paddle):
            image3 = transform(image, self._transform_ops_strong)
            image3 = image3.transpose((2, 0, 1))

-            return (image2, image3, np.int64(label))
-
-
-# def np_convert_pil(array):
-#     """
-#     array conver image
-#     Args:
-#         array: array and dim is 1
-#     """
-#     assert len(array.shape), "dim of array should 1"
-#     img = Image.fromarray(array.reshape(3, 32, 32).transpose(1, 2, 0))
-#     return img
-
-
-# class CIFAR10(cifar.Cifar10):
-#     """
-#     cifar10 dataset
-#     """
-#     def __init__(self, data_file, download=True, mode='train'):
-#         super().__init__(download=download, mode=mode)
-#         if data_file is not None:
-#             os.makedirs(data_file, exist_ok=True)
-#             if not os.path.exists(os.path.join(data_file, 'cifar-10-python.tar.gz')):
-#                 shutil.move('~/.cache/paddle/dataset/cifar/cifar-10-python.tar.gz', data_file)
-#         self.num_classes = 10
-#         self.x = []
-#         self.y = []
-#         for d in self.data:
-#             self.x.append(d[0])
-#             self.y.append(d[1])
-
-#         self.x = np.array(self.x)
-#         self.y = np.array(self.y)
-
-#     def __getitem__(self, idx):
-#         return self.x[idx], self.y[idx]
-
-#     def __len__(self):
-#         return self.x.shape[0]
-
-
-# class CIFAR100(cifar.Cifar100):
-#     """
-#     cifar10 dataset
-#     """
-#     def __init__(self, data_file, download=True, mode='train'):
-#         super().__init__(download=download, mode=mode)
-#         if data_file is not None:
-#             os.makedirs(data_file, exist_ok=True)
-#             if not os.path.exists(os.path.join(data_file, 'cifar-100-python.tar.gz')):
-#                 shutil.move('~/.cache/paddle/dataset/cifar/cifar-100-python.tar.gz', data_file)
-#         self.num_classes = 100
-#         self.x = []
-#         self.y = []
-#         for d in self.data:
-#             self.x.append(d[0])
-#             self.y.append(d[1])
-
-#         self.x = np.array(self.x)
-#         self.y = np.array(self.y)
-
-#     def __getitem__(self, idx):
-#         return self.x[idx], self.y[idx]
-
-#     def __len__(self):
-#         return self.x.shape[0]
-
-
-# class CIFAR10SSL(CIFAR10):
-#     """
-#     from Cifar10
-#     """
-
-#     def __init__(self, 
-#                  data_file=None, 
-#                  sample_per_label=None, 
-#                  download=True,
-#                  expand_labels=1,
-#                  mode='train',
-#                  transform_ops=None,
-#                  transform_w=None,
-#                  transform_s1=None,
-#                  transform_s2=None):
-#         super().__init__(data_file, download=download, mode=mode)
-#         self.data_type = 'unlabeled_train' if mode == 'train' else 'val'
-#         if transform_ops is not None and sample_per_label is not None:
-#             index = []
-#             self.data_type = 'labeled_train'
-#             for c in range(self.num_classes):
-#                 idx = np.where(self.y == c)[0]
-#                 idx = np.random.choice(idx, sample_per_label, False)
-#                 index.extend(idx)
-#             index = index * expand_labels
-#             # print(index)
-#             self.x = self.x[index]
-#             self.y = self.y[index]
-#         self.transforms = [transform_ops] if transform_ops is not None else [transform_w, transform_s1, transform_s2]
-#         self.mode = mode
-
-#     def __getitem__(self, idx):
-#         img, label = np_convert_pil(self.x[idx]), self.y[idx]
-#         results = ListTransform(self.transforms)(img)
-#         if self.data_type == 'unlabeled_train':
-#             return results
-#         return results[0], label
-        
-#     def __len__(self):
-#         return self.x.shape[0]
-        
-
-
-
-# class CIFAR100SSL(CIFAR100):
-#     """
-#     from Cifar100
-#     """
-
-#     def __init__(self, 
-#                  data_file=None, 
-#                  sample_per_label=None, 
-#                  download=True,
-#                  expand_labels=1,
-#                  mode='train',
-#                  transform_ops=None,
-#                  transform_w=None,
-#                  transform_s1=None,
-#                  transform_s2=None):
-#         super().__init__(data_file, download=download, mode=mode)
-#         self.data_type = 'unlabeled_train' if mode == 'train' else 'val'
-#         if transform_ops is not None and sample_per_label is not None:
-#             index = []
-#             self.data_type = 'labeled_train'
-#             for c in range(self.num_classes):
-#                 idx = np.where(self.y == c)[0]
-#                 idx = np.random.choice(idx, sample_per_label, False)
-#                 index.extend(idx)
-#             index = index * expand_labels
-#             # print(index)
-#             self.x = self.x[index]
-#             self.y = self.y[index]
-#         self.transforms = [transform_ops] if transform_ops is not None else [transform_w, transform_s1, transform_s2]
-#         self.mode = mode
-
-#     def __getitem__(self, idx):
-#         img, label = np_convert_pil(self.x[idx]), self.y[idx]
-#         results = ListTransform(self.transforms)(img)
-#         if self.data_type == 'unlabeled_train':
-#             return results
-#         return results[0], label
-        
-#     def __len__(self):
-#         return self.x.shape[0]
-
-
-# def x_u_split(num_labeled, num_classes, label):
-#     """
-#     split index of dataset to labeled x and unlabeled u
-#     Args:
-#         num_labeled: num of labeled dataset
-#         label: list or array, label
-#     """
-#     assert num_labeled <= len(label), "arg num_labeled should <= num of label"
-#     label = np.array(label) if isinstance(label, list) else label
-#     label_per_class = num_labeled // num_classes
-#     labeled_idx = []
-#     unlabeled_idx = np.array(list(range(label.shape[0])))
-#     for c in range(num_classes):
-#         idx = np.where(label == c)[0]
-#         idx = np.random.choice(idx, label_per_class, False)
-#         labeled_idx.extend(idx)
-    
-#     np.random.shuffle(labeled_idx)
-#     return labeled_idx, unlabeled_idx
+            return (image2, image3, np.int64(label))
--- a/ppcls/data/preprocess/__init__.py
+++ b/ppcls/data/preprocess/__init__.py
@ -56,8 +56,6 @@ from ppcls.data.preprocess.batch_ops.batch_operators import MixupCutmixHybrid
 import numpy as np
 from PIL import Image
 import random
-from paddle.vision.transforms import transforms as T
-from paddle.vision.transforms.transforms import RandomCrop, ToTensor, Normalize


 def transform(data, ops=[]):
@ -123,41 +121,4 @@ class TimmAutoAugment(RawTimmAutoAugment):
            img = np.asarray(img)

        return img
-
-
-# class BaseTransform:
-#     def __init__(self, cfg) -> None:
-#         """
-#         Args:
-#             cfg: list [dict, dict, dict]
-#         """
-#         ts = []
-#         for op in cfg:
-#             name = list(op.keys())[0]
-#             if op[name] is None:
-#                 ts.append(eval(name)())
-#             else:
-#                 ts.append(eval(name)(**(op[name])))
-
-#         self.t = T.Compose(ts)
-
-#     def __call__(self, img):
-        
-#         return self.t(img)
-
-
-# class ListTransform:
-#     def __init__(self, ops) -> None:
-#         """
-#         Args:
-#             ops: list[list[dict, dict], ...]
-#         """
-#         self.ts = []
-#         for op in ops:
-#             self.ts.append(BaseTransform(op))
-
-#     def __call__(self, img):
-#         results = []
-#         for op in self.ts:
-#             results.append(op(img))
-#         return results
+        
--- a/ppcls/loss/__init__.py
+++ b/ppcls/loss/__init__.py
@ -22,7 +22,6 @@ from .pairwisecosface import PairwiseCosface
 from .dmlloss import DMLLoss
 from .distanceloss import DistanceLoss
 from .softtargetceloss import SoftTargetCrossEntropy
-from .ccssl_loss import CCSSLLoss
 from .distillationloss import DistillationCELoss
 from .distillationloss import DistillationGTCELoss
 from .distillationloss import DistillationDMLLoss
--- a/ppcls/loss/ccssl_loss.py
+++ b/ppcls/loss/ccssl_loss.py
@ -1,53 +1,14 @@
-
 from ppcls.engine.train.train import forward
 from .softsuploss import SoftSupConLoss
 import copy
 import paddle.nn as nn


-class CCSSLLoss(nn.Layer):
-    def __init__(self, **kwargs):
-        super(CCSSLLoss, self).__init__()
-        ce_cfg = copy.deepcopy(kwargs['CELoss'])
-        self.ce_weight = ce_cfg.pop('weight')
-        softsupconloss_cfg = copy.deepcopy(kwargs['SoftSupConLoss'])
-        self.softsupconloss_weight = softsupconloss_cfg.pop('weight')
-
-        self.softsuploss = SoftSupConLoss(**softsupconloss_cfg)
-        self.celoss = nn.CrossEntropyLoss(reduction='none')
-
-    def forward(self, feats, batch, **kwargs):
-        """
-        Args:
-            feats: feature of s1 and s2, (n, 2, d)
-            batch: dict 
-        """
-        logits_w = batch['logits_w']
-        logits_s1 = batch['logits_s1']
-        p_targets_u_w = batch['p_targets_u_w']
-        mask = batch['mask']
-
-        max_probs = batch['max_probs']
-        # reduction = batch['reduction']
-       
-
-        loss_u = self.celoss(logits_s1, p_targets_u_w) * mask
-        loss_u = loss_u.mean()
-
-        loss_c = self.softsuploss(feats, max_probs, p_targets_u_w)
-
-        return {'CCSSLLoss': self.ce_weight*loss_u + self.softsupconloss_weight * loss_c}
-
-
-
-
-
 class CCSSLCeLoss(nn.Layer):
    def __init__(self, **kwargs):
        super(CCSSLCeLoss, self).__init__()
        self.celoss = nn.CrossEntropyLoss(reduction='none')

-
    def forward(self, inputs, batch, **kwargs):
        p_targets_u_w = batch['p_targets_u_w']
        logits_s1 = batch['logits_s1']
@ -56,6 +17,3 @@ class CCSSLCeLoss(nn.Layer):
        loss_u = loss_u.mean()

        return {'CCSSLCeLoss': loss_u}
-
-
-
--- a/ppcls/loss/softsuploss.py
+++ b/ppcls/loss/softsuploss.py
@ -41,7 +41,6 @@ class SoftSupConLoss(nn.Layer):
            
            score_mask = paddle.matmul(max_probs, max_probs.T)
            
-            
            mask = paddle.multiply(mask, score_mask)
            
        contrast_count = feat.shape[1]
@ -55,7 +54,6 @@ class SoftSupConLoss(nn.Layer):
        mask = paddle.concat([mask, mask], axis=0)
        mask = paddle.concat([mask, mask], axis=1)
        
-        # mask = paddle.repeat_interleave(paddle.repeat_interleave(mask, 2, 0), 2, 1)
        logits_mask = 1 - paddle.eye(batch_size * contrast_count, dtype=paddle.float64)
        mask = mask * logits_mask
        exp_logits = paddle.exp(logits) * logits_mask
@ -68,6 +66,4 @@ class SoftSupConLoss(nn.Layer):
            loss = loss.mean()

        return {"SoftSupConLoss": loss}
-    
-
-
+    
--- a/ppcls/optimizer/learning_rate.py
+++ b/ppcls/optimizer/learning_rate.py
@ -519,21 +519,3 @@ class CosineFixmatch(LRBase):
            last_epoch=self.last_epoch)
        setattr(learning_rate, "by_epoch", self.by_epoch)
        return learning_rate
-
-
-
-def cosine_schedule_with_warmup(learning_rate,
-                                num_warmup_steps,
-                                num_training_steps,
-                                num_cycles=7./16,
-                                last_epoch=-1,
-                                **kwargs):
-    
-    def _lr_lambda(current_step):
-        if current_step < num_warmup_steps:
-            return float(current_step) /  float(max(1, num_warmup_steps))
-        no_progress = float(current_step - num_warmup_steps) / float(max(1, num_training_steps - num_warmup_steps))
-        return max(0., math.cos(math.pi * num_cycles * no_progress))
-
-    return lr.LambdaDecay(learning_rate=learning_rate, lr_lambda=_lr_lambda)
-