Spaces:

histlearn
/

communitynotesbr

Running

histlearn committed on Apr 24

Commit

2dd975b

verified ·

1 Parent(s): a2ad1d2

fix: cast emb ao dtype da head (corrige F.linear em CPU sem autocast)

Files changed (1) hide show

inference.py CHANGED Viewed

@@ -181,7 +181,9 @@ def predict_batch(
             out = encoder(**toks)
             emb = last_token_pool(out.last_hidden_state, toks["attention_mask"])
             emb = F.normalize(emb, p=2, dim=1)
-            logits = head(emb).squeeze(-1)
             p = torch.sigmoid(logits).float().cpu().numpy()
         preds.append(p)

             out = encoder(**toks)
             emb = last_token_pool(out.last_hidden_state, toks["attention_mask"])
             emb = F.normalize(emb, p=2, dim=1)
+            # Em CPU sem autocast, o encoder sai em fp16 e a head permanece em fp32 →
+            # F.linear recusa. Igualar ao dtype da head resolve (inofensivo em GPU).
+            logits = head(emb.to(head.weight.dtype)).squeeze(-1)
             p = torch.sigmoid(logits).float().cpu().numpy()
         preds.append(p)