name
Browse files
myolmoe/modeling_myolmoe.py
CHANGED
|
@@ -1073,7 +1073,7 @@ class MyOlmoeForCausalLM(OlmoePreTrainedModel, GenerationMixin):
|
|
| 1073 |
#
|
| 1074 |
return MoeCausalLMOutputWithPast(
|
| 1075 |
loss=loss,
|
| 1076 |
-
aux_loss=
|
| 1077 |
logits=logits,
|
| 1078 |
past_key_values=outputs.past_key_values,
|
| 1079 |
hidden_states=outputs.hidden_states,
|
|
|
|
| 1073 |
#
|
| 1074 |
return MoeCausalLMOutputWithPast(
|
| 1075 |
loss=loss,
|
| 1076 |
+
aux_loss=total_aux_loss,
|
| 1077 |
logits=logits,
|
| 1078 |
past_key_values=outputs.past_key_values,
|
| 1079 |
hidden_states=outputs.hidden_states,
|