saracandu
/

stldec_random_16_large

Text Generation

Model card · Files and versions

saracandu committed on Aug 21, 2025

Commit

886c8fb

·

verified ·

1 Parent(s): 75bfa8f

Upload tokenizer

Files changed (1) hide show

tokenizer.py +3 -5

tokenizer.py CHANGED Viewed

@@ -1,9 +1,10 @@
 import re
 import os
-import json
 from typing import Any, Dict, List, Optional, Tuple, Union
 from transformers import PreTrainedTokenizer
 from transformers.utils import logging
 logger = logging.get_logger(__name__)
@@ -17,10 +18,7 @@ def load_json(path: str) -> Union[Dict, List]:
     Returns:
         Union[Dict, List]: The parsed content of the JSON file, which could be a dictionary or a list.
     """
-    full_path = path
-    if not os.path.exists(full_path):
-        # carica relativo alla posizione del file tokenizer.py
-        full_path = os.path.join(os.path.dirname(__file__), path)
     with open(full_path, "r", encoding="utf-8") as f:
         return json.load(f)

 import re
 import os
 from typing import Any, Dict, List, Optional, Tuple, Union
 from transformers import PreTrainedTokenizer
 from transformers.utils import logging
+from pathlib import Path
+import json
 logger = logging.get_logger(__name__)
     Returns:
         Union[Dict, List]: The parsed content of the JSON file, which could be a dictionary or a list.
     """
+    full_path = Path(__file__).parent / path
     with open(full_path, "r", encoding="utf-8") as f:
         return json.load(f)