boltuix
/

EntityBERT

Model card Files and versions

boltuix committed on Jun 10, 2025

Commit

7d47c04

·

verified ·

1 Parent(s): 2ed5136

Update README.md

Files changed (1) hide show

README.md +17 -4

README.md CHANGED Viewed

@@ -103,23 +103,36 @@ Use the model for NER with the following Python code:
 ```python
 from transformers import AutoTokenizer, AutoModelForTokenClassification, pipeline
 # Load model and tokenizer
 tokenizer = AutoTokenizer.from_pretrained("boltuix/EntityBERT")
 model = AutoModelForTokenClassification.from_pretrained("boltuix/EntityBERT")
-# Create NER pipeline
 nlp = pipeline("token-classification", model=model, tokenizer=tokenizer, aggregation_strategy="simple")
 # Input text
-text = "Dr. Sarah Lee at Johns Hopkins, Baltimore, MD, books a flight to Rochester, MN on July 10, 2025, contact +1-410-955-5000 or sarah.lee@jhmi.edu, visit www.airmed.com."
 # Run inference
 ner_results = nlp(text)
-# Print results
 for entity in ner_results:
-    print(f"{entity['word']:15} -> {entity['entity']}")
 ```
 ### ✨ Example Output

 ```python
 from transformers import AutoTokenizer, AutoModelForTokenClassification, pipeline
+import json
+from collections import defaultdict
 # Load model and tokenizer
 tokenizer = AutoTokenizer.from_pretrained("boltuix/EntityBERT")
 model = AutoModelForTokenClassification.from_pretrained("boltuix/EntityBERT")
+# Create NER pipeline with aggregation
 nlp = pipeline("token-classification", model=model, tokenizer=tokenizer, aggregation_strategy="simple")
 # Input text
+text = (
+    "Plan a trip to Miami from Orlando"
+)
 # Run inference
 ner_results = nlp(text)
+# Organize into dictionary by entity_group
+entities = defaultdict(list)
 for entity in ner_results:
+    group = entity["entity_group"]
+    word = entity["word"]
+    entities[group].append(word)
+# Format results into final JSON structure
+formatted_output = {k: " ".join(v) for k, v in entities.items()}
+# Pretty-print as JSON
+print(json.dumps(formatted_output, indent=2))
 ```
 ### ✨ Example Output