YongganFu committed on
Commit
6fd2f7d
·
verified ·
1 Parent(s): d6895e6

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +1 -1
README.md CHANGED
@@ -32,7 +32,7 @@ model = model.cuda().to(torch.bfloat16)
32
  user_input = input("User: ").strip()
33
 
34
  prompt_ids = tokenizer(user_input,return_tensors='pt').input_ids.to(device='cuda')
35
- out_ids, nfe = model.generate(prompt_ids, max_new_tokens=128, steps=128, block_length=32, threshold=0.9)
36
 
37
  tokenized_out = tokenizer.batch_decode(out_ids[:, prompt_ids.shape[1]:], skip_special_tokens=True)[0]
38
  print(f"Model: {tokenized_out}")
 
32
  user_input = input("User: ").strip()
33
 
34
  prompt_ids = tokenizer(user_input,return_tensors='pt').input_ids.to(device='cuda')
35
+ out_ids, nfe = model.generate(prompt_ids, max_new_tokens=128, steps=128, block_length=32, shift_logits=False, threshold=0.9)
36
 
37
  tokenized_out = tokenizer.batch_decode(out_ids[:, prompt_ids.shape[1]:], skip_special_tokens=True)[0]
38
  print(f"Model: {tokenized_out}")