# MeetGeniusAI / app.py
# (Hugging Face Space file header: uploaded by LovnishVerma, commit 0152b21, verified)
import os
import re
import uuid
import shutil
import threading
import torch
from io import BytesIO
import numpy as np
import subprocess # Replacing os.system for stability
import time
from flask import Flask, render_template, request, jsonify, send_file
import yt_dlp
import whisper
from sentence_transformers import SentenceTransformer
from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
from docx import Document
from reportlab.lib.pagesizes import A4
from reportlab.pdfgen import canvas
from reportlab.lib.utils import simpleSplit
app = Flask(__name__)
# Global lock: serialises all heavy processing so only one job runs at a time.
LOCK = threading.Lock()

# ---- CONFIGURATION ----
JOB_TTL_SECONDS = 30 * 60  # 30 minutes
CLEANUP_INTERVAL = 10 * 60  # 10 minutes
BASE_DIR = "jobs"  # per-job working directories are created under this folder
os.makedirs(BASE_DIR, exist_ok=True)
# In-memory results store: job_id -> {summary, notes, conclusion, vectors, created_at}
JOB_STORE = {}
# --- DEVICE SETUP ---
# Prefer CUDA when available; all models below are loaded onto this device.
DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
print(f"๐Ÿš€ Device selected: {DEVICE}")
if DEVICE == "cuda":
    print(f"๐ŸŽฎ GPU: {torch.cuda.get_device_name(0)}")
    torch.cuda.empty_cache()  # Clear old cache
# --- FFMPEG AUTO-DETECTION (FIXED) ---
# Auto-detects where FFmpeg is installed if it is not already on PATH.
if shutil.which("ffmpeg") is None:
    print("โš ๏ธ CRITICAL ERROR: FFmpeg is not installed or not in PATH!")
    print("๐Ÿ‘‰ Please install FFmpeg from https://ffmpeg.org/download.html and add to System Variables.")
    # Fallback for Windows default path if user forgot to add to PATH
    possible_path = r"C:\ffmpeg\bin"
    if os.path.exists(possible_path):
        # Append to PATH for this process so subprocess calls can find ffmpeg.
        os.environ["PATH"] += os.pathsep + possible_path
        print(f"โœ… Found FFmpeg at {possible_path}, added to path.")
    else:
        print("โŒ FFmpeg not found. Audio processing will fail.")
# --- LOAD MODELS ---
# Whisper for speech-to-text, MiniLM for retrieval embeddings,
# FLAN-T5 for abstractive conclusions and question answering.
print("โณ Loading AI models (One-time setup)...")
try:
    whisper_model = whisper.load_model("base", device=DEVICE)
    embedder = SentenceTransformer("all-MiniLM-L6-v2", device=DEVICE)
    qa_model_name = "google/flan-t5-base"
    tokenizer = AutoTokenizer.from_pretrained(qa_model_name)
    qa_model = AutoModelForSeq2SeqLM.from_pretrained(qa_model_name).to(DEVICE)
    print("โœ… All Models loaded successfully")
except Exception as e:
    print(f"โŒ Model Loading Error: {e}")
    # Use SystemExit directly instead of the site-module `exit()` helper,
    # which is not guaranteed to exist when Python runs without `site`.
    raise SystemExit(1)
# --- HELPER FUNCTIONS ---
def extract_audio(input_path, output_path):
    """Convert any audio/video file to 16 kHz mono WAV for Whisper.

    Uses subprocess for safe execution (no shell). Raises ``Exception`` with
    ffmpeg's stderr output on failure so callers can show a useful message,
    and also when the ffmpeg binary itself is missing (previously this leaked
    a raw ``FileNotFoundError``).
    """
    command = [
        "ffmpeg", "-y", "-i", input_path,
        "-ac", "1", "-ar", "16000", "-vn", output_path,
    ]
    try:
        # Capture stderr instead of discarding it: it carries the only useful
        # diagnostics when the conversion fails.
        subprocess.run(
            command,
            check=True,
            stdout=subprocess.DEVNULL,
            stderr=subprocess.PIPE,
        )
    except FileNotFoundError:
        # ffmpeg binary not on PATH — see the startup auto-detection block.
        raise Exception("FFmpeg conversion failed: ffmpeg executable not found in PATH")
    except subprocess.CalledProcessError as e:
        detail = e.stderr.decode(errors="replace").strip() if e.stderr else e
        raise Exception(f"FFmpeg conversion failed: {detail}")
def clean_sentences(text):
    """Split raw transcript text into a list of cleaned sentences.

    Collapses any word repeated three or more times in a row into a single
    occurrence, splits on sentence-ending punctuation, normalises internal
    whitespace, and drops fragments of two words or fewer.
    """
    deduped = re.sub(r'\b(\w+)( \1\b){2,}', r'\1', text, flags=re.I)
    pieces = re.split(r'(?<=[.!?]) +', deduped)
    cleaned = []
    for piece in pieces:
        if len(piece.split()) > 2:
            cleaned.append(re.sub(r'\s+', ' ', piece.strip()))
    return cleaned
def to_paragraphs(sentences, n=4):
    """Group *sentences* into paragraphs of *n*, separated by blank lines."""
    paragraphs = []
    for start in range(0, len(sentences), n):
        paragraphs.append(" ".join(sentences[start:start + n]))
    return "\n\n".join(paragraphs)
def summarize(sentences):
    """Return an (extractive summary, abstractive conclusion) pair.

    The summary is the three sentences whose embeddings are closest to the
    document centroid, re-ordered chronologically so the result reads in the
    order the speaker said them. The conclusion is generated by the seq2seq
    model from the first 20 sentences.
    """
    if not sentences:
        return "No content.", "No conclusion."

    # --- Extractive summary: score sentences against the mean embedding ---
    with torch.no_grad():
        embeddings = embedder.encode(sentences, normalize_embeddings=True, batch_size=8)
    centroid = np.mean(embeddings, axis=0)
    # Keep the original index alongside each score so we can restore order.
    ranked = [(np.dot(vec, centroid), idx, sent)
              for idx, (sent, vec) in enumerate(zip(sentences, embeddings))]
    best_three = sorted(ranked, key=lambda item: item[0], reverse=True)[:3]
    # Re-sort the winners by index: earliest sentence first, latest last.
    in_time_order = sorted(best_three, key=lambda item: item[1])
    summary = " ".join(sent for _, _, sent in in_time_order)

    # --- Abstractive conclusion from the opening context ---
    opening = " ".join(sentences[:20])
    prompt = f"Summarize the main point of this text in one professional paragraph:\n\n{opening}"
    input_ids = tokenizer(prompt, return_tensors="pt", max_length=512, truncation=True).input_ids.to(DEVICE)
    with torch.no_grad():
        generated = qa_model.generate(input_ids, max_length=150, num_beams=4, early_stopping=True)
    conclusion = tokenizer.decode(generated[0], skip_special_tokens=True)
    return summary, conclusion
def build_vectors(job_id):
    """Embed the job's notes paragraph-by-paragraph for later Q&A retrieval."""
    job = JOB_STORE[job_id]
    job["vectors"] = []
    chunks = job["notes"].split("\n\n")
    # Empty notes split to [''] — nothing worth embedding.
    if not chunks or chunks == ['']:
        return
    with torch.no_grad():
        embeddings = embedder.encode(chunks, normalize_embeddings=True)
    for chunk, vec in zip(chunks, embeddings):
        job["vectors"].append({"text": chunk, "vector": vec})
def transcribe(path):
    """Run Whisper on the audio file at *path* and return the transcript text."""
    with torch.no_grad():
        result = whisper_model.transcribe(path, fp16=(DEVICE == "cuda"), verbose=False)
    if DEVICE == "cuda":
        # Transcription can leave large buffers on the GPU; reclaim VRAM now.
        torch.cuda.empty_cache()
    return " ".join(segment["text"] for segment in result["segments"])
def generate_ai_answer(question, context):
    """Answer *question* grounded in *context* using the FLAN-T5 model."""
    prompt = f"answer based on context: {context} question: {question}"
    input_ids = tokenizer(prompt, return_tensors="pt", max_length=512, truncation=True).input_ids.to(DEVICE)
    with torch.no_grad():
        generated = qa_model.generate(input_ids, max_length=200, num_beams=4, early_stopping=True)
    return tokenizer.decode(generated[0], skip_special_tokens=True)
# --- FLASK ROUTES ---
@app.route("/")
def index():
return render_template("landing.html")
def new_job():
    """Create a fresh entry in JOB_STORE and return its job id.

    Caps the store at 20 jobs by evicting the oldest entry first, so the
    in-memory store cannot grow without bound.
    """
    if len(JOB_STORE) >= 20:
        oldest = min(JOB_STORE, key=lambda jid: JOB_STORE[jid]['created_at'])
        JOB_STORE.pop(oldest)
    job_id = str(uuid.uuid4())
    JOB_STORE[job_id] = {
        "summary": "",
        "notes": "",
        "conclusion": "",
        "vectors": [],
        "created_at": time.time(),
    }
    return job_id
@app.route("/dashboard", methods=["GET", "POST"])
def dashboard():
active_tab = request.args.get('tab', 'youtube')
context = {}
if request.method == "POST":
# Changed to Blocking Lock: Wait instead of error
with LOCK:
job_id = new_job()
job_dir = os.path.join(BASE_DIR, job_id)
os.makedirs(job_dir, exist_ok=True)
try:
url = request.form.get("youtube_url")
if not url: raise Exception("URL is missing")
print(f"๐Ÿ“ฅ Processing: {url}")
ydl_opts = {
'format': 'bestaudio/best',
'outtmpl': os.path.join(job_dir, 'audio.%(ext)s'),
'postprocessors': [{'key': 'FFmpegExtractAudio','preferredcodec': 'wav'}],
'quiet': True,
'nocheckcertificate': True, # Ignore SSL errors
'socket_timeout': 10, # Retry quickly if stuck
'retries': 10, # Retry more times
}
with yt_dlp.YoutubeDL(ydl_opts) as ydl:
ydl.download([url])
# Find the wav file
audio_files = [f for f in os.listdir(job_dir) if f.endswith(".wav")]
if not audio_files: raise Exception("Download failed, no audio file found.")
audio_path = os.path.join(job_dir, audio_files[0])
# Transcribe & Process
text = transcribe(audio_path)
sents = clean_sentences(text)
if not sents: raise Exception("Audio transcribed but text was empty.")
summary, conclusion = summarize(sents)
notes = to_paragraphs(sents)
JOB_STORE[job_id].update({"summary": summary, "notes": notes, "conclusion": conclusion})
build_vectors(job_id)
context = {
"job_id": job_id, "summary": summary,
"transcript": notes, "conclusion": conclusion
}
except Exception as e:
print(f"โŒ Error: {e}")
context["error"] = f"Processing Failed: {str(e)}"
finally:
shutil.rmtree(job_dir, ignore_errors=True)
return render_template("dashboard.html", active_tab=active_tab, **context)
@app.route("/enterprise", methods=["POST"])
def enterprise_submit():
with LOCK: # Blocking Lock
file = request.files.get("audio_file")
if not file:
return render_template("dashboard.html", active_tab="enterprise", error="No file uploaded")
job_id = new_job()
job_dir = os.path.join(BASE_DIR, job_id)
os.makedirs(job_dir, exist_ok=True)
try:
original_path = os.path.join(job_dir, file.filename)
file.save(original_path)
wav_path = os.path.join(job_dir, "clean.wav")
# Convert to safe format
extract_audio(original_path, wav_path)
text = transcribe(wav_path)
sents = clean_sentences(text)
if not sents: raise Exception("No speech detected.")
summary, conclusion = summarize(sents)
notes = to_paragraphs(sents)
JOB_STORE[job_id].update({"summary": summary, "notes": notes, "conclusion": conclusion})
build_vectors(job_id)
return render_template("dashboard.html", active_tab="enterprise", job_id=job_id, summary=summary, transcript=notes, conclusion=conclusion)
except Exception as e:
return render_template("dashboard.html", active_tab="enterprise", error=str(e))
finally:
shutil.rmtree(job_dir, ignore_errors=True)
@app.route("/live_submit", methods=["POST"])
def live_submit():
with LOCK: # Locking taaki dusra process clash na kare
file = request.files.get("audio_file")
if not file:
return jsonify({"error": "No audio received"}), 400
job_id = new_job()
job_dir = os.path.join(BASE_DIR, job_id)
os.makedirs(job_dir, exist_ok=True)
try:
# Live recording aksar .webm ya .ogg format mein hoti hai
original_path = os.path.join(job_dir, "live_input.webm")
file.save(original_path)
wav_path = os.path.join(job_dir, "clean.wav")
# Convert WebM/OGG to WAV for Whisper
extract_audio(original_path, wav_path)
# --- Process Audio (Same as Enterprise) ---
text = transcribe(wav_path)
sents = clean_sentences(text)
if not sents: raise Exception("No speech detected in live recording.")
summary, conclusion = summarize(sents)
notes = to_paragraphs(sents)
JOB_STORE[job_id].update({"summary": summary, "notes": notes, "conclusion": conclusion})
build_vectors(job_id)
# JSON response return karein kyuki ye AJAX call hoga
return jsonify({
"job_id": job_id,
"summary": summary,
"transcript": notes,
"conclusion": conclusion,
"status": "success"
})
except Exception as e:
print(f"โŒ Live Error: {e}")
return jsonify({"error": str(e)}), 500
finally:
shutil.rmtree(job_dir, ignore_errors=True)
@app.route("/ask", methods=["POST"])
def ask():
data = request.json if request.is_json else request.form
jid = data.get("job_id")
question = data.get("question")
if not jid or jid not in JOB_STORE:
return jsonify({"answer": "Session expired or invalid. Please upload again."})
store = JOB_STORE[jid].get("vectors", [])
if not store:
return jsonify({"answer": "No content available to answer from."})
try:
q_vec = embedder.encode(question, normalize_embeddings=True)
scored = sorted([(np.dot(q_vec, i["vector"]), i["text"]) for i in store], reverse=True)[:3]
context_text = " ".join([t for _, t in scored])
answer = generate_ai_answer(question, context_text)
return jsonify({"answer": answer})
except Exception as e:
return jsonify({"answer": "I couldn't generate an answer due to an error."})
# --- DOWNLOAD ROUTES (UNCHANGED BUT SAFE) ---
@app.route("/download/word/<job_id>")
def download_word(job_id):
d = JOB_STORE.get(job_id)
if not d: return "Expired ID", 404
doc = Document()
doc.add_heading("AI Summary Report", 0)
doc.add_paragraph(f"Generated on: {time.ctime()}")
doc.add_heading("Summary", 1)
doc.add_paragraph(d["summary"])
doc.add_heading("Conclusion", 1)
doc.add_paragraph(d["conclusion"])
doc.add_heading("Full Transcript", 1)
doc.add_paragraph(d["notes"])
path = f"{job_id}.docx"
doc.save(path)
return send_file(path, as_attachment=True)
@app.route("/download/pdf/<job_id>")
def download_pdf(job_id):
d = JOB_STORE.get(job_id)
if not d:
return "Expired ID", 404
pdf_path = f"{job_id}_MeetGenius_Report.pdf"
c = canvas.Canvas(pdf_path, pagesize=A4)
width, height = A4
x_margin = 40
y = height - 50
def draw_text(title, text):
nonlocal y
c.setFont("Helvetica-Bold", 14)
c.drawString(x_margin, y, title)
y -= 25
c.setFont("Helvetica", 11)
lines = simpleSplit(text, "Helvetica", 11, width - 80)
for line in lines:
if y < 50:
c.showPage()
y = height - 50
c.setFont("Helvetica", 11)
c.drawString(x_margin, y, line)
y -= 15
y -= 20
draw_text("AI Summary Report", f"Generated on: {time.ctime()}")
draw_text("Summary", d["summary"])
draw_text("Conclusion", d["conclusion"])
draw_text("Full Transcript", d["notes"])
c.save()
return send_file(
pdf_path,
as_attachment=True,
download_name="MeetGenius_AI_Report.pdf",
mimetype="application/pdf"
)
# ---- CLEANUP THREAD ----
def cleanup_old_jobs():
    """Background loop: drop expired jobs and stale report files.

    Runs forever (started as a daemon thread). Every CLEANUP_INTERVAL seconds
    it removes JOB_STORE entries older than JOB_TTL_SECONDS and deletes
    leftover .pdf/.docx/.wav files in the working directory past the same TTL.
    """
    while True:
        time.sleep(CLEANUP_INTERVAL)
        now = time.time()
        # Clean the in-memory store under the lock — request handlers mutate it.
        with LOCK:
            keys_to_remove = [k for k, v in JOB_STORE.items()
                              if now - v['created_at'] > JOB_TTL_SECONDS]
            for k in keys_to_remove:
                del JOB_STORE[k]
        # Sweep report files written to the CWD by the download handlers.
        for f in os.listdir("."):
            if f.endswith((".pdf", ".docx", ".wav")):
                try:
                    if now - os.path.getmtime(f) > JOB_TTL_SECONDS:
                        os.remove(f)
                except OSError:
                    # File vanished or is in use — best-effort cleanup; catch
                    # only OS errors rather than the old bare `except:`.
                    pass
        print("๐Ÿงน Cleanup cycle completed.")
if __name__ == "__main__":
t = threading.Thread(target=cleanup_old_jobs, daemon=True)
t.start()
app.run(host="0.0.0.0", port=7860)