robinfaro
/

molm_log_prob

Text Generation

Model card Files and versions

robinfaro committed on Jun 24, 2025

Commit

6896b8f

·

verified ·

1 Parent(s): b2ca9ad

Adding modeling.py file

Files changed (1) hide show

modeling.py +3 -3

modeling.py CHANGED Viewed

@@ -107,7 +107,7 @@ class MoLM(PreTrainedModel):
                 # Expand the expert_mask to match the logits shape (batch_size, 1, 1)
                 expert_mask_expanded = expert_mask.unsqueeze(-1).unsqueeze(-1).float()
-                expert_output = expert(input_ids, targets=targets, date=date, get_logits=True, **kwargs)
                 logits = expert_output["logits"]
                 loss_to_log = expert_output["loss_to_log"]
@@ -234,10 +234,10 @@ class MoLM(PreTrainedModel):
     def generate_from_string(self, in_str, max_new_tokens, date=None, temperature=1.0, top_k=None):
         idx = (
             torch.tensor(
-                self.tokenizer.encode(in_str, allowed_special={"<|endoftext|>"})
             )
             .view(1, -1)
-            .to(self.lm_head.weight.device)
         )
         out_idx = (
             self.generate(idx, max_new_tokens, date, temperature, top_k)

                 # Expand the expert_mask to match the logits shape (batch_size, 1, 1)
                 expert_mask_expanded = expert_mask.unsqueeze(-1).unsqueeze(-1).float()
+                expert_output = expert(input_ids, targets=targets, date=date, **kwargs)
                 logits = expert_output["logits"]
                 loss_to_log = expert_output["loss_to_log"]
     def generate_from_string(self, in_str, max_new_tokens, date=None, temperature=1.0, top_k=None):
         idx = (
             torch.tensor(
+                self.tokenizer.encode(in_str)
             )
             .view(1, -1)
+            .to(next(self.parameters()).device)
         )
         out_idx = (
             self.generate(idx, max_new_tokens, date, temperature, top_k)