# first_bot / app.py
import gradio as gr
from huggingface_hub import InferenceClient
import torch
from sentence_transformers import SentenceTransformer
# Initialize the model client
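# Depending on the deployment, the InferenceClient may need an HF access token
# (for example via the HF_TOKEN environment variable or the token= argument).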
client = InferenceClient("microsoft/phi-4")
# Load biology specification text
with open("bio_spec.txt", "r", encoding="utf-8", errors="replace") as f:
    bio_spec_text = f.read()
# Preprocess text into chunks
def preprocess_text(text):
    # Split the specification into non-empty, whitespace-stripped lines
    return [chunk.strip() for chunk in text.strip().split("\n") if chunk.strip()]
bio_chunks = preprocess_text(bio_spec_text)
# Load sentence transformer model and encode chunks
embedding_model = SentenceTransformer("all-MiniLM-L6-v2")
chunk_embeddings = embedding_model.encode(bio_chunks, convert_to_tensor=True)
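# chunk_embeddings is a (num_chunks, 384) tensor: all-MiniLM-L6-v2 produces 384-dimensional embeddings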
# Retrieve the most relevant chunks
def get_top_chunks(query, chunk_embeddings, text_chunks, top_k=3):
    # Embed the query, then rank chunks by cosine similarity (dot product of L2-normalised vectors)
    query_embedding = embedding_model.encode(query, convert_to_tensor=True)
    query_norm = torch.nn.functional.normalize(query_embedding, p=2, dim=0)
    chunks_norm = torch.nn.functional.normalize(chunk_embeddings, p=2, dim=1)
    similarities = torch.matmul(chunks_norm, query_norm)
    top_indices = torch.topk(similarities, k=top_k).indices
    return [text_chunks[i] for i in top_indices]
# Global state
chosen_topic = None
chosen_mode = None
# Gradio callbacks
def set_topic(topic):
    global chosen_topic
    chosen_topic = topic
    return f"✅ Great! You've chosen **{topic}**."
def set_mode(mode):
    global chosen_mode
    chosen_mode = mode
    return f"✅ You have selected **{mode}** mode."
# Generate system prompt based on mode
def get_system_prompt():
    global chosen_mode, chosen_topic
    if not chosen_topic or not chosen_mode:
        return "Please select both a topic and a mode to start."
    relevant_chunks = get_top_chunks(chosen_topic, chunk_embeddings, bio_chunks, top_k=4)
    spec_content = "\n".join(relevant_chunks)
    if chosen_mode == "exam mode":
        prompt = (
            f"You are now asking **GCSE Biology exam-style questions** on the topic '{chosen_topic}'. "
            f"Ask one question at a time. Wait for the user to answer before giving feedback or asking the next question. "
            f"Use the following specification excerpts as reference:\n{spec_content}"
        )
    else:
        prompt = (
            f"You are a helpful science tutor teaching '{chosen_topic}' in small, digestible sections. "
            f"Focus on clear explanations suitable for 14-16 year olds. "
            f"Use the following specification excerpts as reference:\n{spec_content}"
        )
    return prompt
# Chatbot response
def respond(message, history):
    system_prompt = get_system_prompt()
    if "Please select both" in system_prompt:
        return system_prompt  # Early return if topic or mode not selected
    messages = [{"role": "system", "content": system_prompt}]
    if history:
        messages.extend(history)
    messages.append({"role": "user", "content": message})
    response = client.chat_completion(messages, max_tokens=300)
    return response.choices[0].message.content.strip()
# Topic and mode lists
BIO_TOPICS = [
    "Cell Biology",
    "Organisation",
    "Infection and Response",
    "Bioenergetics",
    "Homeostasis and Response",
    "Inheritance, Variation and Evolution",
    "Ecology",
]
exam_mode = ["exam mode", "learning mode"]
# Gradio interface
with gr.Blocks() as demo:
    gr.Markdown("# ACE it! 📚 – GCSE Biology Tutor")
    with gr.Row():
        topic_dropdown = gr.Dropdown(choices=BIO_TOPICS, label="Choose a Biology Topic")
        topic_button = gr.Button("Confirm Topic")
        topic_output = gr.Markdown()
    with gr.Row():
        exam_dropdown = gr.Dropdown(choices=exam_mode, label="Which mode would you like?")
        exam_button = gr.Button("Confirm Mode")
        exam_output = gr.Markdown()
    chatbot = gr.ChatInterface(respond, type="messages", title="ACE it!")
    topic_button.click(set_topic, inputs=topic_dropdown, outputs=topic_output)
    exam_button.click(set_mode, inputs=exam_dropdown, outputs=exam_output)
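# Note: when running locally, demo.launch(share=True) would also create a temporary public URL
# (a Gradio feature; not needed on a hosted Space).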
demo.launch()