Spaces:

kwkintervu
/

intervu

Runtime error

App Files Files Community

intervu / app.py

maahikachitagi

Update app.py

980eae5 verified 7 months ago

raw

history blame contribute delete

9.65 kB

	# --- IMPORTS ---
	import gradio as gr
	from huggingface_hub import InferenceClient
	import re
	import random
	import whisper
	from pydub import AudioSegment
	import torch
	import torchvision.transforms as transforms
	import torchvision.models as models
	from PIL import Image

	# --- LOAD MODELS ---

	# Remote chat model (Zephyr 7B beta), reached through the Hugging Face inference client.
	client = InferenceClient(model="HuggingFaceH4/zephyr-7b-beta")

	# Local Whisper "base" checkpoint used for speech-to-text.
	whisper_model = whisper.load_model(name="base")

	# ResNet18 backbone with ImageNet weights, used as the posture classifier.
	model = models.resnet18(weights=models.ResNet18_Weights.IMAGENET1K_V1)
	# The 1000-class ImageNet head is swapped for a fresh 2-class linear layer.
	# NOTE(review): no fine-tuned weights are loaded anywhere in the visible code,
	# so this new head appears to be randomly initialised -- confirm.
	model.fc = torch.nn.Linear(in_features=model.fc.in_features, out_features=2)
	model.eval()

	# Image preprocessing: resize to 224x224, then convert to a float tensor.
	transform = transforms.Compose(
	    [
	        transforms.Resize(size=(224, 224)),
	        transforms.ToTensor(),
	    ]
	)

	# --- LOAD QUESTIONS ---
	def load_questions(file_path):
	    """Parse a question-bank text file into a list of question records.

	    The text is split on ``Question:`` markers; anything before the first
	    marker is discarded. Inside each block, the text before
	    ``Possible Answers:`` is the question and the text after it is split
	    into individual answers on ``<number>.`` prefixes.

	    Args:
	        file_path: Path of the text file to read. It is decoded as UTF-8.

	    Returns:
	        A list of dicts, each with the keys ``'question'`` (str) and
	        ``'answers'`` (list of str), in file order.

	    Raises:
	        OSError: If the file cannot be opened.
	    """
	    # Explicit encoding so parsing does not depend on the platform default.
	    with open(file_path, 'r', encoding='utf-8') as f:
	        data = f.read()

	    questions = []
	    for block in re.split(r'Question:\s*', data)[1:]:
	        parts = block.split('Possible Answers:')
	        if len(parts) < 2:
	            # Malformed block without an answer section: skip it rather
	            # than crash the whole app with an IndexError at import time.
	            continue
	        question_text = parts[0].strip()
	        answers_text = parts[1].strip()
	        possible_answers = [
	            ans.strip()
	            for ans in re.split(r'\d+\.\s+', answers_text)
	            if ans.strip()
	        ]
	        questions.append({'question': question_text, 'answers': possible_answers})
	    return questions

	all_questions = load_questions('knowledge.txt')

	# Keywords that assign a question to an interview type. A question belongs
	# to a type when any keyword occurs as a substring of its lower-cased text,
	# so one question may appear under several types (or none).
	_KEYWORDS_BY_TYPE = {
	    'Technical': [
	        'function', 'linked list', 'url', 'rest', 'graphql', 'garbage', 'cap theorem', 'sql', 'hash table',
	        'stack', 'queue', 'recursion', 'reverse', 'bfs', 'dfs', 'time complexity', 'binary search tree',
	        'web application', 'chat system', 'load balancing', 'caching', 'normalization', 'acid', 'indexing',
	        'sql injection', 'https', 'xss', 'hash', 'vulnerabilities',
	    ],
	    'Competency-Based Interview': [
	        "debugging", "learning", "deadlines", "teamwork", "leadership", "mistake", "conflict", "decision",
	    ],
	    'Case': [
	        "testing", "financial", "automation", "analysis", "regression", "business", "stakeholder",
	    ],
	}

	# Interview type -> list of matching question records (file order preserved).
	questions_by_type = {
	    interview_type: [
	        q for q in all_questions
	        if any(keyword in q['question'].lower() for keyword in keywords)
	    ]
	    for interview_type, keywords in _KEYWORDS_BY_TYPE.items()
	}

	# --- AUDIO TRANSCRIPTION ---
	def transcribe_audio(file_path):
	    """Convert an audio file to WAV and transcribe it with the Whisper model.

	    Args:
	        file_path: Path of the recorded or uploaded audio file. May be
	            ``None`` or empty when the user submitted nothing.

	    Returns:
	        The transcribed text, or a string starting with "❌ ERROR:" when no
	        file was given or any step failed. ``handle_audio`` relies on that
	        "❌" prefix to detect failure, so errors are reported as text
	        instead of being raised.
	    """
	    import os
	    import tempfile

	    if not file_path:
	        return "❌ ERROR: No audio provided."

	    try:
	        audio = AudioSegment.from_file(file_path)
	        # Convert inside a private temporary directory: a fixed
	        # "converted.wav" in the working directory would be overwritten by
	        # concurrent requests and was never cleaned up.
	        with tempfile.TemporaryDirectory() as tmp_dir:
	            converted_path = os.path.join(tmp_dir, "converted.wav")
	            # export() hands back the open output file; close it so the
	            # data is flushed and the handle is not leaked.
	            audio.export(converted_path, format="wav").close()
	            result = whisper_model.transcribe(converted_path, fp16=False)
	        return result["text"]
	    except Exception as e:
	        # Deliberately broad: this is the UI boundary and the caller expects
	        # an error string, not an exception.
	        return f"❌ ERROR: {str(e)}"

	# --- POSTURE CLASSIFICATION ---
	def classify_image(image):
	    """Classify a posture snapshot as good or bad with the ResNet18 model.

	    Args:
	        image: A PIL image or a numpy image array (what a Gradio Image
	            component delivers by default), or ``None`` when nothing was
	            captured.

	    Returns:
	        A user-facing message: a prompt to provide an image when ``image``
	        is ``None``, the "good posture" message when the model predicts
	        class 0, and the "bad posture" message otherwise.
	    """
	    if image is None:
	        return "No image provided! Please upload or capture an image."

	    # torchvision's Resize only accepts PIL images or tensors, so a raw
	    # numpy array from the UI must be wrapped first.
	    if not isinstance(image, Image.Image):
	        image = Image.fromarray(image)
	    # ResNet expects exactly three channels; drop alpha / expand greyscale.
	    image = image.convert("RGB")

	    batch = transform(image).unsqueeze(0)
	    # Inference only: skip building the autograd graph.
	    with torch.no_grad():
	        output = model(batch)
	    _, predicted = torch.max(output, 1)

	    if predicted.item() == 0:
	        return "✅ Good Posture! Sit exactly like that for your Interview!"
	    return "⚠️ Bad Posture — try sitting straighter or more centered for your real interview."

	# --- INTERVIEW LOGIC ---

	def set_type(choice, user_profile):
	    """Store the chosen interview type and ask for the candidate's background.

	    Args:
	        choice: Interview type label selected by the user.
	        user_profile: Session profile dict; updated in place.

	    Returns:
	        A ``(prompt, user_profile)`` tuple: the next-step message and the
	        same profile dict that was passed in.
	    """
	    user_profile.update(interview_type=choice)
	    next_prompt = "Great! What’s your background and what field/role are you aiming for?"
	    return next_prompt, user_profile

	def save_background(info, user_profile):
	    """Store the candidate's background and tell them how to begin.

	    Args:
	        info: Free-text background / target role entered by the user.
	        user_profile: Session profile dict; updated in place.

	    Returns:
	        A ``(prompt, user_profile)`` tuple: the next-step message and the
	        same profile dict that was passed in.
	    """
	    user_profile.update(field=info)
	    next_prompt = "Awesome! Type 'start' below to begin your interview."
	    return next_prompt, user_profile

	def respond(message, chat_history, user_profile):
	    """Handle one user message and append the bot's reply to the chat history.

	    Dispatch order:
	      1. Profile incomplete (no interview type or field): ask the user to
	         finish the setup steps.
	      2. ``start``: begin a new interview with up to 10 random questions.
	      3. ``stop`` while an interview is running: end it.
	      4. Any other message while an interview is running: record it as the
	         answer to the current question and ask the next one.
	      5. ``feedback``: compare the recorded answers with the reference ones.
	      6. Anything else: free-form reply from the chat model.

	    Args:
	        message: Text typed (or transcribed) from the user.
	        chat_history: List of ``(user_text, bot_text)`` tuples; mutated in
	            place.
	        user_profile: Session profile dict; mutated in place.

	    Returns:
	        The same ``chat_history`` list with the new exchange appended.
	    """
	    message_lower = message.strip().lower()

	    if not user_profile.get("interview_type") or not user_profile.get("field"):
	        bot_msg = "Please finish steps 1 and 2 before starting the interview."
	        chat_history.append((message, bot_msg))
	        return chat_history

	    if message_lower == 'start':
	        return _start_interview(message, chat_history, user_profile)

	    in_progress = user_profile.get("interview_in_progress")

	    if message_lower == 'stop' and in_progress:
	        user_profile['interview_in_progress'] = False
	        bot_msg = "Interview stopped. Type 'feedback' if you'd like me to analyze your answers. Thanks for interviewing with Intervu!"
	        chat_history.append((message, bot_msg))
	        return chat_history

	    if in_progress:
	        return _record_answer(message, chat_history, user_profile)

	    if message_lower == 'feedback':
	        chat_history.append((message, generate_feedback(user_profile)))
	        return chat_history

	    return _chat_with_model(message, chat_history, user_profile)


	def _start_interview(message, chat_history, user_profile):
	    """Pick up to 10 random questions for the chosen type and ask the first."""
	    interview_type = user_profile['interview_type']
	    pool = questions_by_type.get(interview_type, [])
	    if not pool:
	        # No question matched this type: say so instead of failing with an
	        # IndexError on the first question.
	        bot_msg = f"Sorry, I couldn't find any {interview_type} questions. Please choose a different interview type."
	        chat_history.append((message, bot_msg))
	        return chat_history

	    # random.sample returns a new list, so the shared module-level question
	    # bank is not reordered for every other session.
	    selected_questions = random.sample(pool, min(10, len(pool)))

	    user_profile['questions'] = selected_questions
	    user_profile['current_q'] = 0
	    user_profile['user_answers'] = []
	    user_profile['interview_in_progress'] = True

	    intro = f"Welcome to your {interview_type} interview for a {user_profile['field']} position. I will ask you up to 10 questions. Type 'stop' anytime to end."
	    first_q = f"First question: {selected_questions[0]['question']}"
	    chat_history.append((message, intro))
	    chat_history.append(("", first_q))
	    return chat_history


	def _record_answer(message, chat_history, user_profile):
	    """Store the answer to the current question, then ask the next or finish."""
	    user_profile['user_answers'].append(message)
	    q_index = user_profile['current_q'] + 1
	    user_profile['current_q'] = q_index

	    if q_index < len(user_profile['questions']):
	        bot_msg = f"Next question: {user_profile['questions'][q_index]['question']}"
	    else:
	        user_profile['interview_in_progress'] = False
	        bot_msg = "Interview complete! Type 'feedback' if you'd like me to analyze your answers. Thanks for interviewing with Intervu!"
	    chat_history.append((message, bot_msg))
	    return chat_history


	def _chat_with_model(message, chat_history, user_profile):
	    """Send the conversation so far to the chat model and append its reply."""
	    messages = [{"role": "system", "content": f"You are a professional interviewer conducting a {user_profile['interview_type']} interview for a candidate in {user_profile['field']}."}]
	    for user_text, bot_text in chat_history:
	        messages.append({"role": "user", "content": user_text})
	        messages.append({"role": "assistant", "content": bot_text})
	    messages.append({"role": "user", "content": message})

	    response = client.chat_completion(messages, max_tokens=150, stream=False)
	    bot_msg = response.choices[0].message.content
	    chat_history.append((message, bot_msg))
	    return chat_history

	def generate_feedback(user_profile):
	    """Compare the recorded answers with the reference answers.

	    An answer counts as good when any reference answer occurs in it as a
	    case-insensitive substring.

	    Args:
	        user_profile: Session profile dict. Reads ``'questions'`` (list of
	            question records with an ``'answers'`` list) and
	            ``'user_answers'`` (list of str); missing keys are treated as
	            empty.

	    Returns:
	        One feedback line per answered question, joined with newlines, or a
	        short notice when no answers have been recorded.
	    """
	    questions = user_profile.get('questions', [])
	    answers = user_profile.get('user_answers', [])
	    if not answers:
	        # Avoid posting an empty chat bubble when there is nothing to review.
	        return "No answers recorded yet. Type 'start' to begin an interview."

	    feedback = []
	    # zip pairs each answer with its question and stops at the shorter list.
	    for number, (question, user_ans) in enumerate(zip(questions, answers), start=1):
	        correct_answers = question['answers']
	        answer_lower = user_ans.lower()
	        if any(ans.lower() in answer_lower for ans in correct_answers):
	            fb = f"Question {number}: ✅ Good job!"
	        elif correct_answers:
	            fb = f"Question {number}: ❌ Missed key points: {correct_answers[0]}"
	        else:
	            # A question without reference answers used to raise IndexError.
	            fb = f"Question {number}: ❌ No reference answer available."
	        feedback.append(fb)
	    return "\n".join(feedback)

	# --- AUDIO HANDLING ---
	def handle_audio(audio_file, chat_history, user_profile):
	    """Transcribe a spoken answer and route it through the text handler.

	    Args:
	        audio_file: Path of the recorded or uploaded audio.
	        chat_history: List of ``(user_text, bot_text)`` tuples; mutated in
	            place.
	        user_profile: Session profile dict, passed on to ``respond``.

	    Returns:
	        The updated chat history. When transcription fails (the result
	        starts with "❌"), the error text is shown as the bot reply to an
	        "Audio input" entry instead of being treated as an answer.
	    """
	    text = transcribe_audio(audio_file)
	    transcription_failed = text.startswith("❌")
	    if not transcription_failed:
	        return respond(text, chat_history, user_profile)
	    chat_history.append(("Audio input", text))
	    return chat_history

	# --- GRADIO INTERFACE ---

	def _as_messages(history):
	    """Convert (user, bot) tuples into role/content dicts for the Chatbot.

	    The interview handlers keep history as tuples, while a Chatbot created
	    with type="messages" renders a list of {"role", "content"} dicts. Empty
	    sides of a tuple (e.g. the bot asking a question unprompted) are skipped.
	    """
	    messages = []
	    for user_text, bot_text in history:
	        if user_text:
	            messages.append({"role": "user", "content": user_text})
	        if bot_text:
	            messages.append({"role": "assistant", "content": bot_text})
	    return messages


	def _send_text(message, history, profile):
	    """Click handler for typed input: returns chatbot messages and both states."""
	    history = respond(message, history, profile)
	    return _as_messages(history), history, profile


	def _send_audio(audio_file, history, profile):
	    """Click handler for audio input: returns chatbot messages and both states."""
	    history = handle_audio(audio_file, history, profile)
	    return _as_messages(history), history, profile


	def _type_setter(choice):
	    """Build a click handler that stores one fixed interview type."""
	    def _handler(profile):
	        return set_type(choice, profile)
	    return _handler


	with gr.Blocks() as demo:
	    # Per-session state: the candidate profile and the tuple-based history.
	    user_profile = gr.State({"interview_type": "", "field": "", "interview_in_progress": False})
	    chat_history = gr.State([])

	    gr.Markdown("# 🎤 Welcome to Intervu")
	    gr.Image(value="images.JPEG", show_label=False, width=200)

	    gr.Markdown("### Step 1: Choose Interview Type")
	    with gr.Row():
	        with gr.Column():
	            btn1 = gr.Button("Technical")
	            btn2 = gr.Button("Competency-Based Interview")
	            btn3 = gr.Button("Case")
	    type_output = gr.Textbox(label="Bot response", interactive=False)

	    # Each button passes its own label as the interview type; a closure
	    # replaces the hidden Textbox components previously used as constants.
	    btn1.click(_type_setter("Technical"), inputs=[user_profile], outputs=[type_output, user_profile])
	    btn2.click(_type_setter("Competency-Based Interview"), inputs=[user_profile], outputs=[type_output, user_profile])
	    btn3.click(_type_setter("Case"), inputs=[user_profile], outputs=[type_output, user_profile])

	    gr.Markdown("### Step 2: Enter Your Background")
	    background = gr.Textbox(label="Your background and field/goal")
	    background_btn = gr.Button("Submit")
	    background_output = gr.Textbox(label="Bot response", interactive=False)
	    background_btn.click(save_background, inputs=[background, user_profile], outputs=[background_output, user_profile])

	    gr.Markdown("### Step 3: Start Interview")
	    chatbot = gr.Chatbot(label="Interview Bot", type="messages")
	    with gr.Row():
	        msg = gr.Textbox(label="Your message")
	        audio_input = gr.Audio(type="filepath", label="🎙️ Upload or Record your answer")
	    with gr.Row():
	        send_btn = gr.Button("Send Text")
	        audio_btn = gr.Button("Send Audio")

	    # The states are listed as outputs so the updated history and profile
	    # are written back explicitly rather than relying on in-place mutation.
	    chat_outputs = [chatbot, chat_history, user_profile]
	    send_btn.click(_send_text, inputs=[msg, chat_history, user_profile], outputs=chat_outputs, queue=False)
	    send_btn.click(lambda: "", None, msg, queue=False)  # clear the input box
	    audio_btn.click(_send_audio, inputs=[audio_input, chat_history, user_profile], outputs=chat_outputs, queue=False)

	    # Step 4: Webcam Posture Check
	    gr.Markdown("### Step 4: Webcam Posture Check")
	    # `sources` (a list) replaced the old `source` keyword in Gradio 4, the
	    # same generation that Chatbot(type="messages") requires. type="pil"
	    # gives the classifier a PIL image, which its transform accepts.
	    webcam = gr.Image(sources=["webcam", "upload"], type="pil", label="Capture Posture")

	    posture_output = gr.Textbox(label="Posture Feedback")
	    posture_btn = gr.Button("Analyze Posture")
	    posture_btn.click(classify_image, inputs=[webcam], outputs=[posture_output])

	# LAUNCH
	# Start the server only when run as a script, so importing this module
	# does not launch the app.
	if __name__ == "__main__":
	    demo.launch()