tencent
/

Youtu-LLM-2B

Text Generation

Model card · Files and versions

Junrulu committed 15 days ago

Commit

459fda5

·

verified ·

1 Parent(s): 108c40a

remove redundant function

Files changed (1) hide show

modeling_youtu.py +0 -24

modeling_youtu.py CHANGED Viewed

@@ -414,30 +414,6 @@ class YoutuPreTrainedModel(PreTrainedModel):
         "attentions": YoutuMLAttention,
     }
-    def init_weights(self):
-        """
-        If needed prunes and maybe initializes weights. If using a custom `PreTrainedModel`, you need to implement any
-        initialization logic in `_init_weights`.
-        """
-        # Prune heads if needed
-        if self.config.pruned_heads:
-            self.prune_heads(self.config.pruned_heads)
-        if "-init" in self.name_or_path:
-            # Initialize weights
-            self.apply(self._initialize_weights)
-            # Adjust weights of o_proj in Attention and down_proj in MLP
-            for name, module in self.named_modules():
-                if "o_proj" in name or "down_proj" in name:
-                    # For the output projection, we reinitialize the weights
-                    scaled_std = self.config.initializer_range * (1.0 / self.config.num_hidden_layers) ** 0.5
-                    module.weight.data.normal_(mean=0.0, std=scaled_std)
-            # Tie weights should be skipped when not initializing all weights
-            # since from_pretrained(...) calls tie weights anyways
-            self.tie_weights()
     def _init_weights(self, module):
         super()._init_weights(module)
         std = self.config.initializer_range

         "attentions": YoutuMLAttention,
     }
     def _init_weights(self, module):
         super()._init_weights(module)
         std = self.config.initializer_range