Charlie81 committed on
Commit
3325c29
·
1 Parent(s): d121ac8

revert variable assignment hidden states shape

Browse files
Files changed (1) hide show
  1. modeling_myolmoe.py +1 -1
modeling_myolmoe.py CHANGED
@@ -319,7 +319,7 @@ class MyOLMoESparseMoeBlock(nn.Module):
319
 
320
  def forward(self, hidden_states: torch.Tensor) -> Tuple[torch.Tensor, torch.Tensor, torch.Tensor]:
321
  print(f"DEBUG: MoE forward start - hidden_states shape: {hidden_states.shape}")
322
- batch_size, seq_len = hidden_states.shape
323
  hidden_states = hidden_states.view(-1, self.hidden_size)
324
 
325
  # Get routing weights and selected experts
 
319
 
320
  def forward(self, hidden_states: torch.Tensor) -> Tuple[torch.Tensor, torch.Tensor, torch.Tensor]:
321
  print(f"DEBUG: MoE forward start - hidden_states shape: {hidden_states.shape}")
322
+ batch_size, seq_len, _ = hidden_states.shape
323
  hidden_states = hidden_states.view(-1, self.hidden_size)
324
 
325
  # Get routing weights and selected experts