Spaces:

mingbaer
/

CapstoneProject

Runtime error

App Files Files Community

CapstoneProject / app.py

mingbaer

debug syntax

c1d3cbc verified 12 months ago

raw

history blame

2.51 kB

	# FRONTEND: Python library that makes it super easy to build simple user interfaces (UIs)
	import gradio as gr
	# BACKEND: tool from Hugging Face library to send messages to AI models and get answers back
	from huggingface_hub import InferenceClient
	# Helpful commentary from ChatGPT:
	# Gradio is the face and mouth — it lets people talk to the robot.
	# InferenceClient is the brain connector — it lets your robot talk to a super-smart brain (the Hugging Face model) and get answers.
	from sentence_transformers import SentenceTransformer
	# a Python library that allows you to turn sentences into numerical vector embeddings
	import torch
	# a machine learning library that that performs cosine similarity calculations
	import numpy as np

	# upload knowledge base - from sentiment analysis lab
	with open("essay_writing.txt", "r", encoding="utf-8") as f:
	essay_writing = f.read()

	# split the text into chunks
	cleaned_chunks = [chunk.strip() for chunk in essay_writing.split("\n\n") if chunk.strip()]

	# load an embedding model
	model = SentenceTransformer('all-MiniLM-L6-v2')

	chunk_embeddings = model.encode(cleaned_chunks, convert_to_tensor=True)

	def pull_relevant_info(query, top_k=3):
	query_embedding = model.encode(query, convert_to_tensor=True)
	query_embedding_normalized = query_embedding / query_embedding.norm()

	chunk_embeddings_normalized = chunk_embeddings / chunk_embeddings.norm(dim=1, keepdim=True)

	similarities = torch.matmul(chunk_embeddings_normalized, query_embedding_normalized)

	top_indices = torch.topk(similarities, k=top_k).indices.cpu().numpy()

	relevant_info = "\n\n".join([cleaned_chunks[i] for i in top_indices])

	return relevant_info

	client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")

	def respond(message, history):

	info = pull_relevant_info(message, top_k=3)
	system_message = (f"You are a friendly chatbot. Use the following information to help answer the user's question:\n{info}\n")
	messages = [{"role": "system", "content": system_message}]

	if history:
	messages.extend(history)

	messages.append({"role": "user", "content": message})

	response = ""

	for message_chunk in client.chat_completion(
	messages,
	max_tokens=100,
	stream=True
	):
	token = message_chunk['choices'][0]['delta'].get('content', '')
	respond += token

	yield response


	chatbot = gr.ChatInterface(respond, type="messages")

	chatbot.launch()