Fix layer key name for dynamic LR in the AdamWDL optimizer

This commit is contained in:
gaotingquan 2023-05-24 12:17:53 +00:00 committed by cuicheng01
parent 80ae9079cd
commit 042d1e7ef8

View File

@ -411,7 +411,10 @@ class AdamWDL(object):
idx = static_name.find("blocks.")
layer = int(static_name[idx:].split(".")[1])
ratio = decay_rate**(n_layers - layer)
elif "embed" in static_name:
elif any([
key in static_name
for key in ["embed", "token", "conv1", "ln_pre"]
]):
ratio = decay_rate**(n_layers + 1)
# param.optimize_attr["learning_rate"] *= ratio
return ratio