File size: 434 Bytes
31c0ef2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18

import sys
import torch
from transformers import AutoTokenizer

# Decode a hard-coded list of token ids with the tokenizer stored at `model`
# and write the resulting text to stdout.

# Sample token-id sequences. Only `input_ids` is decoded below; the alternate
# sample is kept under its own name (instead of being assigned to `input_ids`
# and immediately overwritten) so it can be swapped in by hand.
alt_input_ids = [32, 720, 103, 432, 146, 167, 1400, 195, 294, 1083, 111]
input_ids = [1, 88, 64, 779, 2, 64, 1, 89, 64]

# NOTE: despite its name, `model` holds a filesystem path, not a model object.
model = "/sgl-workspace/guppylm-9M"

# NOTE(review): trust_remote_code=True lets the tokenizer loader execute
# Python code shipped with the checkpoint -- only use with trusted paths.
tokenizer = AutoTokenizer.from_pretrained(
    model,
    trust_remote_code=True,
)

# skip_special_tokens=False asks the tokenizer to keep special tokens in the
# decoded text rather than stripping them.
text = tokenizer.decode(
    torch.tensor(input_ids, dtype=torch.long),
    skip_special_tokens=False,
)

# Written without a trailing newline so stdout contains exactly the decoded
# text.
sys.stdout.write(text)