michaelbzhu committed on
Commit
b07a847
·
verified ·
1 Parent(s): d3a2364

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +18 -0
README.md CHANGED
@@ -25,4 +25,22 @@ Model config:
25
  "n_heads": 64,
26
  "n_layers": 3,
27
  "n_vocab": 50257
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
28
  ```
 
25
  "n_heads": 64,
26
  "n_layers": 3,
27
  "n_vocab": 50257
28
+ ```
29
+
30
+ Usage:
31
+ ```
32
+ from transformers import AutoTokenizer, AutoModelForCausalLM
33
+ import torch
34
+
35
+ model = AutoModelForCausalLM.from_pretrained("michaelbzhu/test-3.2B-base", trust_remote_code=True)
36
+ model = model.cuda()
37
+ tokenizer = AutoTokenizer.from_pretrained("michaelbzhu/test-3.2B-base", trust_remote_code=True)
38
+
39
+ prompt = "The future of AI is"
40
+ input_ids = tokenizer.encode(prompt, return_tensors="pt").to(model.device)
41
+ for _ in range(20):
42
+     logits = model(input_ids).logits[0, -1, :]
43
+     next_token = torch.multinomial(torch.softmax(logits, dim=-1), 1).unsqueeze(0)
44
+     input_ids = torch.cat([input_ids, next_token], dim=1)
45
+ print(tokenizer.decode(input_ids[0]))
46
  ```