Update handler.py
Browse files- handler.py +9 -6
handler.py
CHANGED
|
@@ -18,15 +18,18 @@ class EndpointHandler:
|
|
| 18 |
def get_allowed_token_ids(self, vocab_list: List[str]) -> set[int]:
|
| 19 |
"""
|
| 20 |
Generate a set of token IDs for a given list of allowed words.
|
| 21 |
-
Includes
|
| 22 |
"""
|
| 23 |
allowed_ids = set()
|
| 24 |
for word in vocab_list:
|
| 25 |
-
#
|
| 26 |
-
|
| 27 |
-
|
| 28 |
-
|
| 29 |
-
|
|
|
|
|
|
|
|
|
|
| 30 |
return allowed_ids
|
| 31 |
|
| 32 |
def filter_allowed_tokens(self, input_ids: torch.Tensor, scores: np.ndarray, allowed_token_ids: set[int]) -> np.ndarray:
|
|
|
|
| 18 |
def get_allowed_token_ids(self, vocab_list: List[str]) -> set[int]:
    """
    Generate a set of token IDs for a given list of allowed words.

    Includes plain, space-prefixed, capitalized, and uppercase forms of
    each word, so the model can emit a word mid-sentence (space-prefixed
    token) or at the start of a sentence (capitalized form).

    Args:
        vocab_list: Words the model is allowed to generate.

    Returns:
        The union of token IDs for every case/spacing variation of every
        word. An empty ``vocab_list`` yields an empty set.
    """
    allowed_ids: set[int] = set()
    for word in vocab_list:
        # Case variations first; the set dedupes words that are already
        # capitalized/uppercase (e.g. "I" -> one entry, not three).
        variations = {word, word.capitalize(), word.upper()}
        # Space-prefixed forms matter because BPE-style tokenizers encode
        # a leading space into the first token.
        variations |= {" " + v for v in variations}

        for variation in variations:
            # add_special_tokens=False: only the word's own tokens,
            # no BOS/EOS markers.
            allowed_ids.update(
                self.tokenizer.encode(variation, add_special_tokens=False)
            )

    return allowed_ids
|
| 34 |
|
| 35 |
def filter_allowed_tokens(self, input_ids: torch.Tensor, scores: np.ndarray, allowed_token_ids: set[int]) -> np.ndarray:
|