"""Smoke-test a tokenizer: print the tokens, ids, and decoded text for a sample."""

from transformers import AutoTokenizer

# "." is handed to from_pretrained as the tokenizer location, i.e. the
# current directory -- presumably the script is run from the folder that
# holds the tokenizer files; verify against how it is invoked.
tok = AutoTokenizer.from_pretrained(".")

# One sample string drives every step below. The trailing space is part of
# the sample and is kept exactly as written.
text = "Hello world! write code "

# 1) The token pieces the tokenizer produces for the sample.
tokens = tok.tokenize(text)
print(tokens)

# 2) The ids returned by encode() for the same sample.
ids = tok.encode(text)
print(ids)

# 3) Decode the ids back to text, first with default settings ...
decoded = tok.decode(ids)
print(decoded)

# ... then again with skip_special_tokens=True, so the two outputs can be
# compared side by side.
decoded_plain = tok.decode(ids, skip_special_tokens=True)
print(decoded_plain)