Commit
·
2bfe150
1
Parent(s):
7355cf2
Update README.md
Browse files
README.md
CHANGED
|
@@ -42,7 +42,8 @@ This model is not suitable for all use cases due to its limited training time on
|
|
| 42 |
```python
|
| 43 |
import torch
|
| 44 |
from transformers import GPT2Tokenizer, GPT2LMHeadModel
|
| 45 |
-
|
|
|
|
| 46 |
tokenizer = GPT2Tokenizer.from_pretrained('gpt2-medium')
|
| 47 |
model = GPT2LMHeadModel.from_pretrained('gpt2-medium')
|
| 48 |
tokenizer.add_special_tokens({'pad_token': '[PAD]'})
|
|
@@ -68,9 +69,6 @@ def generate_text(model, tokenizer, prompt, max_length=256):
|
|
| 68 |
eos_token_id=tokenizer.eos_token_id,
|
| 69 |
attention_mask=attention_mask)
|
| 70 |
output_ids = tokenizer.decode(output[0], skip_special_tokens=False)
|
| 71 |
-
assistant_token_index = output_ids.index('<|ASSISTANT|>') + len('<|ASSISTANT|>')
|
| 72 |
-
next_token_index = output_ids.find('<|', assistant_token_index)
|
| 73 |
-
output_ids = output_ids[assistant_token_index:next_token_index]
|
| 74 |
return output_ids
|
| 75 |
# Loop to interact with the model
|
| 76 |
while True:
|
|
@@ -78,7 +76,9 @@ while True:
|
|
| 78 |
if prompt == "q":
|
| 79 |
break
|
| 80 |
output_text = generate_text(model, tokenizer, prompt)
|
| 81 |
-
|
|
|
|
|
|
|
| 82 |
```
|
| 83 |
## Deploying and training the model
|
| 84 |
The model has been fine-tuned on a specific input format that goes like this: ```"<|USER|> {user prompt} <|ASSISTANT|> {model prediction} <|End|>"```. For the best performance from the model, the input text should be as follows: ```<|USER|> {dataset prompt} <|ASSISTANT|> ``` and the target/label should be as follows: ```<|USER|> {dataset prompt} <|ASSISTANT|> {dataset output} <|End|>```
|
|
|
|
| 42 |
```python
|
| 43 |
import torch
|
| 44 |
from transformers import GPT2Tokenizer, GPT2LMHeadModel
|
| 45 |
+
start_token = "<|ASSISTANT|>"
|
| 46 |
+
end_token = "<|"
|
| 47 |
tokenizer = GPT2Tokenizer.from_pretrained('gpt2-medium')
|
| 48 |
model = GPT2LMHeadModel.from_pretrained('gpt2-medium')
|
| 49 |
tokenizer.add_special_tokens({'pad_token': '[PAD]'})
|
|
|
|
| 69 |
eos_token_id=tokenizer.eos_token_id,
|
| 70 |
attention_mask=attention_mask)
|
| 71 |
output_ids = tokenizer.decode(output[0], skip_special_tokens=False)
|
|
|
|
|
|
|
|
|
|
| 72 |
return output_ids
|
| 73 |
# Loop to interact with the model
|
| 74 |
while True:
|
|
|
|
| 76 |
if prompt == "q":
|
| 77 |
break
|
| 78 |
output_text = generate_text(model, tokenizer, prompt)
|
| 79 |
+
text_between_tokens = output_text[output_text.find(start_token) + len(start_token):]
|
| 80 |
+
out = text_between_tokens[:text_between_tokens.find(end_token)]
|
| 81 |
+
print(out)
|
| 82 |
```
|
| 83 |
## Deploying and training the model
|
| 84 |
The model has been fine-tuned on a specific input format that goes like this: ```"<|USER|> {user prompt} <|ASSISTANT|> {model prediction} <|End|>"```. For the best performance from the model, the input text should be as follows: ```<|USER|> {dataset prompt} <|ASSISTANT|> ``` and the target/label should be as follows: ```<|USER|> {dataset prompt} <|ASSISTANT|> {dataset output} <|End|>```
|