Update README.md
Browse files
README.md
CHANGED
|
@@ -20,19 +20,25 @@ import torch
|
|
| 20 |
from transformers import AutoTokenizer, AutoModel
|
| 21 |
|
| 22 |
model_id = "heyongxin233/DETree"
|
| 23 |
-
tgt_layer = 18
|
|
|
|
|
|
|
| 24 |
|
| 25 |
tok = AutoTokenizer.from_pretrained(model_id)
|
| 26 |
-
enc = AutoModel.from_pretrained(model_id, output_hidden_states=True)
|
|
|
|
| 27 |
|
| 28 |
texts = ["An example sentence.", "Another one."]
|
| 29 |
batch = tok(texts, padding=True, truncation=True, return_tensors="pt")
|
|
|
|
| 30 |
|
| 31 |
-
with torch.no_grad():
|
| 32 |
out = enc(**batch)
|
| 33 |
-
hs = out.hidden_states[tgt_layer]
|
| 34 |
-
mask = batch["attention_mask"].unsqueeze(-1)
|
| 35 |
hs = hs.masked_fill(~mask.bool(), float("-inf"))
|
| 36 |
-
emb, _ = hs.max(dim=1)
|
| 37 |
emb = torch.nn.functional.normalize(emb, p=2, dim=-1)
|
| 38 |
-
|
|
|
|
|
|
|
|
|
from transformers import AutoTokenizer, AutoModel

model_id = "heyongxin233/DETree"
layer_idx = 18  # 0=embeddings; 1..24=encoder layers (RoBERTa-large)

# Pick the accelerator if one is present, otherwise fall back to CPU.
if torch.cuda.is_available():
    device = "cuda"
else:
    device = "cpu"
print("Using device:", device)

tokenizer = AutoTokenizer.from_pretrained(model_id)
model = AutoModel.from_pretrained(model_id, output_hidden_states=True).to(device)
model.eval()

sentences = ["An example sentence.", "Another one."]
inputs = tokenizer(sentences, padding=True, truncation=True, return_tensors="pt")
inputs = {name: tensor.to(device) for name, tensor in inputs.items()}

with torch.inference_mode():
    outputs = model(**inputs)

# Hidden states of the chosen layer: (batch, seq_len, hidden).
hidden = outputs.hidden_states[layer_idx]
# Broadcastable padding mask: (batch, seq_len, 1).
attn_mask = inputs["attention_mask"].unsqueeze(-1)
# Blank out padded positions so they can never win the max-pool below.
hidden = hidden.masked_fill(~attn_mask.bool(), float("-inf"))
# Max-pool over the token dimension, then L2-normalize each embedding.
embeddings, _ = hidden.max(dim=1)
embeddings = torch.nn.functional.normalize(embeddings, p=2, dim=-1)

print(embeddings.device, embeddings.shape)  # -> (batch_size, 1024)
+
```
|