Include original (pre-normalization) FQN in is_muon logging

Show both normalized and original parameter names so wrapper-injected
components (_orig_mod, _checkpoint_wrapped_module) are visible in logs.

[skip-build]

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

Files changed (1) hide show

torch-ext/optimizer/core.py +8 -6

torch-ext/optimizer/core.py CHANGED Viewed

@@ -92,20 +92,22 @@ def adjust_lr_for_muon(lr, param_shape):
 def default_is_muon(name, x, expert_keys=None):
-    parts = normalize_fqn(name).split(".")
     skip_keys = ["embed_tokens", "lm_head", "tok_embeddings", "output"]
     if any(key in parts for key in skip_keys):
-        logger.info("[is_muon] %s: skip (matched skip_key), ndim=%d", name,
-                    x.ndim)
         return False
     effective_ndim = x.ndim
     is_expert = expert_keys and any(key in parts for key in expert_keys)
     if is_expert:
         effective_ndim -= 1
     result = effective_ndim >= 2
-    logger.info("[is_muon] %s: ndim=%d, expert=%s, effective_ndim=%d → %s",
-                name, x.ndim, is_expert, effective_ndim,
-                "Muon" if result else "AdamW")
     return result

 def default_is_muon(name, x, expert_keys=None):
+    normalized = normalize_fqn(name)
+    parts = normalized.split(".")
     skip_keys = ["embed_tokens", "lm_head", "tok_embeddings", "output"]
     if any(key in parts for key in skip_keys):
+        logger.info("[is_muon] %s (orig: %s): skip (matched skip_key), ndim=%d",
+                    normalized, name, x.ndim)
         return False
     effective_ndim = x.ndim
     is_expert = expert_keys and any(key in parts for key in expert_keys)
     if is_expert:
         effective_ndim -= 1
     result = effective_ndim >= 2
+    logger.info(
+        "[is_muon] %s (orig: %s): ndim=%d, expert=%s, effective_ndim=%d → %s",
+        normalized, name, x.ndim, is_expert, effective_ndim,
+        "Muon" if result else "AdamW")
     return result