Ryan Kingery committed on
Commit
2db9276
·
1 Parent(s): 161b3ed

Update utils.py

Browse files
Files changed (1) hide show
  1. utils.py +4 -1
utils.py CHANGED
@@ -46,7 +46,10 @@ def clean_text(tokens):
46
  text.append(token)
47
  prev_token = token
48
  detokenizer = TreebankWordDetokenizer()
49
- return detokenizer.detokenize(text).replace("' ", "'").replace(" . ", ". ").replace(" ? ", "? ").replace(" ! ", "! ")
 
 
 
50
 
51
  def generate_text(seed, model, vocab, max_len=20, temperature=1., device=device, skip_tokens=['<unk>'], top_k=50):
52
  stoi, itos = vocab.get_stoi(), vocab.get_itos()
 
46
  text.append(token)
47
  prev_token = token
48
  detokenizer = TreebankWordDetokenizer()
49
+ text = detokenizer.detokenize(text)
50
+ text = text.replace(" ' ", "' ").replace("' ", "'")
51
+ text = text.replace(" . . . ", "...").replace(" . ", ". ").replace(" ? ", "? ").replace(" ! ", "! ")
52
+ return text
53
 
54
  def generate_text(seed, model, vocab, max_len=20, temperature=1., device=device, skip_tokens=['<unk>'], top_k=50):
55
  stoi, itos = vocab.get_stoi(), vocab.get_itos()