remove docstrings
Browse files
myolmoe/modeling_myolmoe.py
CHANGED
|
@@ -552,7 +552,7 @@ class OlmoeDecoderLayer(nn.Module):
|
|
| 552 |
return outputs
|
| 553 |
|
| 554 |
|
| 555 |
-
|
| 556 |
class OlmoePreTrainedModel(PreTrainedModel):
|
| 557 |
config_class = OlmoeConfig
|
| 558 |
base_model_prefix = "model"
|
|
@@ -579,7 +579,7 @@ class OlmoePreTrainedModel(PreTrainedModel):
|
|
| 579 |
module.weight.data[module.padding_idx].zero_()
|
| 580 |
|
| 581 |
|
| 582 |
-
|
| 583 |
class OlmoeModel(OlmoePreTrainedModel):
|
| 584 |
def __init__(self, config: OlmoeConfig):
|
| 585 |
super().__init__(config)
|
|
@@ -605,7 +605,7 @@ class OlmoeModel(OlmoePreTrainedModel):
|
|
| 605 |
def set_input_embeddings(self, value):
|
| 606 |
self.embed_tokens = value
|
| 607 |
|
| 608 |
-
|
| 609 |
def forward(
|
| 610 |
self,
|
| 611 |
input_ids: Optional[torch.LongTensor] = None,
|
|
@@ -872,7 +872,7 @@ class OlmoeForCausalLM(OlmoePreTrainedModel, GenerationMixin):
|
|
| 872 |
def get_decoder(self):
|
| 873 |
return self.model
|
| 874 |
|
| 875 |
-
|
| 876 |
def forward(
|
| 877 |
self,
|
| 878 |
input_ids: Optional[torch.LongTensor] = None,
|
|
|
|
| 552 |
return outputs
|
| 553 |
|
| 554 |
|
| 555 |
+
|
| 556 |
class OlmoePreTrainedModel(PreTrainedModel):
|
| 557 |
config_class = OlmoeConfig
|
| 558 |
base_model_prefix = "model"
|
|
|
|
| 579 |
module.weight.data[module.padding_idx].zero_()
|
| 580 |
|
| 581 |
|
| 582 |
+
|
| 583 |
class OlmoeModel(OlmoePreTrainedModel):
|
| 584 |
def __init__(self, config: OlmoeConfig):
|
| 585 |
super().__init__(config)
|
|
|
|
| 605 |
def set_input_embeddings(self, value):
|
| 606 |
self.embed_tokens = value
|
| 607 |
|
| 608 |
+
|
| 609 |
def forward(
|
| 610 |
self,
|
| 611 |
input_ids: Optional[torch.LongTensor] = None,
|
|
|
|
| 872 |
def get_decoder(self):
|
| 873 |
return self.model
|
| 874 |
|
| 875 |
+
|
| 876 |
def forward(
|
| 877 |
self,
|
| 878 |
input_ids: Optional[torch.LongTensor] = None,
|