Moreza009
/

progen2-small-me-2

Model card Files Files and versions

Moreza009 committed on Jun 4, 2025

Commit

3aa5527

·

verified ·

1 Parent(s): 86f2a6b

Update modeling_progen.py

Files changed (1) hide show

modeling_progen.py +0 -4

modeling_progen.py CHANGED Viewed

@@ -613,11 +613,7 @@ class ProGenForCausalLM(ProGenPreTrainedModel):
         # compute loss in fp32 to match with mesh-tf version
         # https://github.com/EleutherAI/gpt-neo/blob/89ce74164da2fb16179106f54e2269b5da8db333/models/gpt2/gpt2.py#L179
         lm_logits = self.lm_head(hidden_states).to(torch.float32)
-        print(f"lm_logits = {lm_logits.shape}")
-        print(f"logits_to_keep = {logits_to_keep}")
-        # Debug shape
-        print(f"Final logits shape: {lm_logits.shape}")  # Should be [batch, seq, vocab]
         loss = None
         if labels is not None:
             # Shift so that tokens < n predict n

         # compute loss in fp32 to match with mesh-tf version
         # https://github.com/EleutherAI/gpt-neo/blob/89ce74164da2fb16179106f54e2269b5da8db333/models/gpt2/gpt2.py#L179
         lm_logits = self.lm_head(hidden_states).to(torch.float32)
         loss = None
         if labels is not None:
             # Shift so that tokens < n predict n