fix GoogLeNet distributed eval bug

2025-06-03 21:55:06 +08:00 · 2021-10-26 11:56:30 +00:00 · 2021-10-26 11:56:30 +00:00 · 2062c20cd8
commit 2062c20cd8
parent c30b72c867
1 changed files with 15 additions and 5 deletions
--- a/ppcls/engine/evaluation/classification.py
+++ b/ppcls/engine/evaluation/classification.py
@@ -73,14 +73,24 @@ def classification_eval(engine, epoch_id=0):
        # calc metric
        if engine.eval_metric_func is not None:
            if paddle.distributed.get_world_size() > 1:
                pred_list = []
                label_list = []
                paddle.distributed.all_gather(label_list, batch[1])
                labels = paddle.concat(label_list, 0)
                if isinstance(out, dict):
                    out = out["logits"]
-                paddle.distributed.all_gather(pred_list, out)
+                if isinstance(out, list):
-                paddle.distributed.all_gather(label_list, batch[1])
+                    pred = []
-                pred = paddle.concat(pred_list, 0)
+                    for x in out:
-                labels = paddle.concat(label_list, 0)
+                        pred_list = []
                        paddle.distributed.all_gather(pred_list, x)
                        pred_x = paddle.concat(pred_list, 0)
                        pred.append(pred_x)
                else:
                    pred_list = []
                    paddle.distributed.all_gather(pred_list, out)
                    pred = paddle.concat(pred_list, 0)
                if accum_samples > total_samples:
                    pred = pred[:total_samples + current_samples -
                                accum_samples]