zai-org
/

chatglm3-6b

Model card Files Files and versions

Fix RMSNorm weight initialization bug.

#59

by Shan1990 - opened Jul 31, 2024

base: refs/heads/main

←

from: refs/pr/59

Discussion Files changed

Files changed (1) hide show

modeling_chatglm.py +1 -1

modeling_chatglm.py CHANGED Viewed

@@ -181,7 +181,7 @@ def apply_rotary_pos_emb(x: torch.Tensor, rope_cache: torch.Tensor) -> torch.Tensor:
 class RMSNorm(torch.nn.Module):
     def __init__(self, normalized_shape, eps=1e-5, device=None, dtype=None, **kwargs):
         super().__init__()
-        self.weight = torch.nn.Parameter(torch.empty(normalized_shape, device=device, dtype=dtype))
         self.eps = eps
     def forward(self, hidden_states: torch.Tensor):

 class RMSNorm(torch.nn.Module):
     def __init__(self, normalized_shape, eps=1e-5, device=None, dtype=None, **kwargs):
         super().__init__()
+        self.weight = torch.nn.Parameter(torch.ones(normalized_shape, device=device, dtype=dtype))
         self.eps = eps
     def forward(self, hidden_states: torch.Tensor):