Spaces:

HSinghHuggingFace
/

gpt-text-generator

Build error

App Files Files Community

gpt-text-generator / app.py

HSinghHuggingFace

use trained model with loss less than 0.01%

123ad3b about 1 year ago

raw

history blame contribute delete

3.98 kB

	import streamlit as st
	import torch
	import tiktoken
	import sys
	import os
	import logging
	import warnings

	# Configure logging and warnings
	# Only records of level ERROR or higher from the 'streamlit' logger pass.
	logging.getLogger('streamlit').setLevel(logging.ERROR)
	# The `message` filter is a regular expression that must match from the
	# START of the warning text, so the leading '.*' is required for the filter
	# to catch "torch.classes" wherever it appears in the message.
	warnings.filterwarnings('ignore', message=r'.*torch\.classes.*')
	warnings.filterwarnings('ignore', category=FutureWarning)

	# Make the directory one level above this file's directory importable.
	# NOTE(review): this is the PARENT of the folder containing this file, not
	# the folder itself -- confirm that is where the `src` package is expected.
	sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))

	from src.config.model_config import GPTConfig
	from src.models.gpt import GPT
	from src.utils.device_utils import get_device

	def _rebuild_state_dict(reference_state, checkpoint_state):
	    """Build a state dict that has exactly the keys of ``reference_state``.

	    For every key ending in ``.weight`` whose ``<key>_orig`` and
	    ``<key>_mask`` companions are both present in ``checkpoint_state`` (the
	    entry names used for pruned parameters), the effective weight is
	    reconstructed as ``orig * mask``. Otherwise the checkpoint value stored
	    under the same key is used, and if the checkpoint has no such key the
	    value from ``reference_state`` is kept.

	    Args:
	        reference_state: Mapping of the freshly built model's state dict.
	        checkpoint_state: Mapping loaded from the checkpoint file.

	    Returns:
	        A ``(merged, missing)`` tuple: the merged mapping and the list of
	        keys that had to fall back to ``reference_state``.
	    """
	    merged = {}
	    missing = []
	    for key, fallback in reference_state.items():
	        if key.endswith('.weight'):
	            # key ends with '.weight', so appending the suffix yields
	            # '<prefix>.weight_orig' / '<prefix>.weight_mask'.
	            orig_key = key + '_orig'
	            mask_key = key + '_mask'
	            if orig_key in checkpoint_state and mask_key in checkpoint_state:
	                # Reconstruct the pruned weight
	                merged[key] = checkpoint_state[orig_key] * checkpoint_state[mask_key]
	                continue

	        if key in checkpoint_state:
	            merged[key] = checkpoint_state[key]
	        else:
	            # Keep the model's own (initial) value, but remember the key so
	            # the caller can report it instead of failing silently.
	            merged[key] = fallback
	            missing.append(key)
	    return merged, missing

	@st.cache_resource
	def load_model():
	    """Build the GPT model, load the weights from ``model.pt`` and return it.

	    The checkpoint is expected to be a mapping with a ``'model_state_dict'``
	    entry. Pruned weights stored as ``*_orig`` / ``*_mask`` pairs are folded
	    back into plain ``.weight`` tensors before loading.

	    Returns:
	        tuple: ``(model, device)`` -- the model converted to float32, moved to
	        ``device`` and switched to eval mode, plus the device returned by
	        ``get_device()``.

	    Raises:
	        KeyError: If the checkpoint has no ``'model_state_dict'`` entry.
	    """
	    device = get_device()
	    model = GPT(GPTConfig())

	    # Load the trained weights; the relative path is resolved against the
	    # current working directory of the process.
	    checkpoint = torch.load('model.pt', map_location=device, weights_only=True)

	    # state_dict() is taken once here instead of once per key in the loop.
	    merged_state, missing_keys = _rebuild_state_dict(
	        model.state_dict(), checkpoint['model_state_dict']
	    )
	    if missing_keys:
	        logging.getLogger(__name__).warning(
	            "Checkpoint is missing %d key(s); keeping initial values for: %s",
	            len(missing_keys),
	            ", ".join(missing_keys),
	        )

	    # Load the processed state dict
	    model.load_state_dict(merged_state)

	    # Convert back to float32 for inference
	    model = model.float()
	    model.to(device)
	    model.eval()

	    return model, device

	def generate_text(model, prompt, max_length=100, num_return_sequences=1, device='cpu'):
	    """Sample continuations of ``prompt`` from ``model``.

	    The prompt is encoded with the tiktoken ``gpt2`` encoding, repeated once
	    per requested sequence, and extended one token at a time by sampling from
	    the softmax of the last-position logits (no temperature or top-k).

	    Args:
	        model: Callable whose result's first element is the logits tensor,
	            indexed here as ``[batch, position, vocab]``.
	        prompt: Text to continue. Special-token strings such as
	            ``<|endoftext|>`` are treated as ordinary text.
	        max_length: Number of NEW tokens to append to the prompt.
	        num_return_sequences: How many independent samples to draw.
	        device: Device the token tensor is moved to before calling the model.

	    Returns:
	        list: One decoded string per sequence; each contains the prompt
	        followed by the sampled tokens.

	    Raises:
	        ValueError: If ``prompt`` encodes to zero tokens.
	    """
	    tokenizer = tiktoken.get_encoding('gpt2')
	    # By default tiktoken raises ValueError when the text contains a special
	    # token string; disallowed_special=() encodes such text as plain text,
	    # which is the safe choice for free-form user input.
	    input_tokens = tokenizer.encode(prompt, disallowed_special=())
	    if not input_tokens:
	        # An empty token list would give an empty float tensor and fail
	        # inside the model with an unrelated-looking error.
	        raise ValueError("prompt must contain at least one token")

	    x = torch.tensor(input_tokens, dtype=torch.long).unsqueeze(0)
	    x = x.repeat(num_return_sequences, 1).to(device)

	    # Calculate final length (input length + requested additional tokens)
	    input_length = x.size(1)
	    target_length = input_length + max_length

	    # Generate text
	    # NOTE(review): the whole sequence is fed to the model at every step and
	    # is never cropped -- confirm prompt + max_length fits the model's
	    # maximum context length.
	    with torch.no_grad():
	        while x.size(1) < target_length:
	            logits = model(x)[0]
	            next_token_logits = logits[:, -1, :]
	            probs = torch.softmax(next_token_logits, dim=-1)
	            next_token = torch.multinomial(probs, num_samples=1)
	            x = torch.cat((x, next_token), dim=1)

	    # Report token counts once, before decoding the sequences
	    st.text(f"Size of Input tokens: {input_length}, Additional tokens to be predicted: {max_length}, Total tokens to be generated: {x.size(1)}")

	    # Decode generated sequences
	    return [tokenizer.decode(row.tolist()) for row in x]

	# Streamlit UI
	st.title("GPT Text Generator")

	# Load model (load_model is wrapped in st.cache_resource)
	model, device = load_model()

	# Input form
	prompt = st.text_area("Enter your prompt:", "Once upon a time")
	max_length = st.slider("Predict additional text of length:", min_value=1, max_value=50, value=5)
	num_sequences = st.slider("Number of sequences to generate:", 1, 5, 1)

	if st.button("Generate"):
	    if not prompt:
	        # An empty prompt encodes to zero tokens, which generation cannot
	        # continue from; tell the user instead of raising.
	        st.warning("Please enter a prompt before generating text.")
	    else:
	        with st.spinner("Generating text..."):
	            generated_texts = generate_text(
	                model=model,
	                prompt=prompt,
	                max_length=max_length,
	                num_return_sequences=num_sequences,
	                device=device,
	            )

	        # Display results, numbering the sequences from 1
	        for i, text in enumerate(generated_texts, 1):
	            st.write(f"\nSequence {i}:")
	            st.write(text)