orlandopozo committed on
Commit
78c0171
·
verified ·
1 Parent(s): 193480f

gpt2 pre-trained model with streamlit data app framework

Browse files
Files changed (1) hide show
  1. app.py +31 -0
app.py ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
"""Streamlit app that continues a user-supplied prompt with pre-trained GPT-2."""

import streamlit as st
from transformers import GPT2LMHeadModel, GPT2Tokenizer

# Name of the pre-trained checkpoint to load.
model_name = "gpt2"

# Number of tokens to generate *in addition to* the prompt.
MAX_NEW_TOKENS = 100


@st.cache_resource
def load_model_and_tokenizer(name):
    """Load the tokenizer and language model for ``name`` once per process.

    Streamlit re-executes this script from the top on every widget
    interaction; caching the loaded objects avoids re-reading the model
    weights each time the user edits the prompt.

    Args:
        name: Checkpoint identifier passed to ``from_pretrained``.

    Returns:
        A ``(tokenizer, model)`` tuple.
    """
    loaded_tokenizer = GPT2Tokenizer.from_pretrained(name)
    loaded_model = GPT2LMHeadModel.from_pretrained(name)
    return loaded_tokenizer, loaded_model


# Load the pre-trained GPT-2 model and tokenizer (cached across reruns).
tokenizer, model = load_model_and_tokenizer(model_name)

# Ask the user for a text prompt.
prompt = st.text_area('Enter the prompt!')

if prompt:
    # Leave room for the generated tokens inside the model's context window
    # so that a very long prompt cannot overflow the position embeddings.
    max_prompt_tokens = model.config.n_positions - MAX_NEW_TOKENS

    # Encode the prompt; calling the tokenizer (rather than ``encode``) also
    # yields the attention mask that ``generate`` expects.
    encoded = tokenizer(
        prompt,
        return_tensors='pt',
        truncation=True,
        max_length=max_prompt_tokens,
    )
    input_ids = encoded["input_ids"]

    # Generate text using the GPT-2 model.
    output = model.generate(
        input_ids,
        attention_mask=encoded["attention_mask"],
        # Budget for new tokens only: ``max_length`` would count the prompt
        # as well and leave nothing to generate for prompts >= 100 tokens.
        max_new_tokens=MAX_NEW_TOKENS,
        # Sampling must be switched on explicitly; otherwise top_k, top_p
        # and temperature are ignored and decoding is greedy.
        do_sample=True,
        num_return_sequences=1,   # Number of sequences to generate
        no_repeat_ngram_size=2,   # Avoid repeating n-grams
        top_k=50,                 # Top-K sampling
        top_p=0.95,               # Top-p (nucleus) sampling
        temperature=0.7,          # Sampling temperature
        # Reuse EOS as the padding id so ``generate`` has an explicit pad
        # token (assumes the checkpoint defines none of its own).
        pad_token_id=tokenizer.eos_token_id,
    )

    # Decode the generated token ids back to a string.
    generated_text = tokenizer.decode(output[0], skip_special_tokens=True)

    # Show the generated text in the app.
    st.write(generated_text)