Spaces:

Asarkar07
/

test_video_summarizer

Sleeping

App Files Files Community

test_video_summarizer / app.py

Asarkar07

Update app.py

f19bcb5 verified 7 months ago

raw

history blame contribute delete

5.81 kB

	import gradio as gr
	import os
	import uuid
	import tempfile
	from method import *

	# --- Video search state (written by process_youtube_link, read by handle_query) ---
	VECTOR_DB = None  # result of build_vector_store; stays None until a video is processed
	CAPTIONS = []  # captions of the processed video, indexed by search result
	FRAMES = []  # extracted frames, indexed with the same position as CAPTIONS
	caption_text = []  # working list of captions for the current video
	caption_embedding = []  # working list of caption embeddings

	# --- Face extraction state (written by face_detect) ---
	extracted_face = []  # items returned by face_crop; each is read via item["face"]
	face_frames = []  # frames sampled for face detection

	# Gradio UI components (populated while the Blocks layout is built).
	# NOTE: face_name_inputs used to be assigned twice in this section; it is
	# now defined exactly once.
	face_image_boxes = []
	face_name_inputs = []

	def handle_query(text):
	    """Return the caption and frame selected by ``search_query`` for ``text``.

	    The result is a ``(caption, frame)`` pair taken from ``CAPTIONS`` and
	    ``FRAMES`` at the index that ``search_query`` reports. If no video has
	    been processed yet (``VECTOR_DB`` is still ``None``), a prompt message
	    and ``None`` are returned instead.
	    """
	    if VECTOR_DB is not None:
	        match_index = search_query(text, VECTOR_DB)
	        return CAPTIONS[match_index], FRAMES[match_index]
	    return "Please process a video first.", None

	def save_face_names(*names):
	    """Pair every submitted name with its face slot and report success.

	    Args:
	        *names: One value per face-name textbox, in slot order.

	    Returns:
	        The status message shown in the UI.

	    Note:
	        The mapping (``face_0``, ``face_1``, ...) is only printed; nothing
	        is stored beyond this call.
	    """
	    # enumerate() pairs each name with its slot without indexing by position.
	    face_name_map = {f"face_{slot}": name for slot, name in enumerate(names)}
	    print("Saved Names Mapping:", face_name_map)
	    return "✅ Names saved for all faces."


	def prepare_faces_and_show():
	    """Build the Gradio updates that reveal extracted faces and name boxes.

	    The returned list is ordered as: one status update, then 20 image
	    updates, then 20 textbox updates (41 items in total). Slots without a
	    corresponding entry in ``extracted_face`` are hidden. When no faces
	    have been extracted, the status reports that and all 40 components are
	    hidden.
	    """
	    # Number of image/textbox pairs; the UI layout creates the same count.
	    slot_count = 20

	    if not extracted_face:
	        hide_everything = [gr.update(visible=False) for _ in range(2 * slot_count)]
	        return [gr.update(value="❌ No faces extracted yet.")] + hide_everything

	    shown = extracted_face[:slot_count]
	    unused_slots = slot_count - len(shown)

	    image_updates = [
	        gr.update(value=entry["face"], visible=True) for entry in shown
	    ] + [gr.update(visible=False) for _ in range(unused_slots)]

	    # Name boxes are reset to empty each time faces are (re)displayed.
	    textbox_updates = [
	        gr.update(visible=True, value="") for _ in shown
	    ] + [gr.update(visible=False) for _ in range(unused_slots)]

	    status_update = [gr.update(value="✅ Faces ready. Enter names below.")]
	    return status_update + image_updates + textbox_updates


	def process_youtube_link(video_file):
	    """Caption an uploaded video and build the vector store used by queries.

	    Despite its name, this handler is wired to the ``gr.Video`` upload
	    component and receives that component's value, not a YouTube URL.

	    Args:
	        video_file: Value of the video input; ``None`` if nothing was uploaded.

	    Returns:
	        A status message for the UI. Failures are reported in the message
	        rather than raised.
	    """
	    # caption_text / caption_embedding are updated in place (slice
	    # assignment), so only the names that are rebound need ``global``.
	    global VECTOR_DB, CAPTIONS, FRAMES

	    try:
	        if video_file is None:
	            return "❌ Please upload a video file."

	        gr.Info("Extracting frames...")
	        frames = extract_unique_frames(video_file)
	        print('extract_unique_frames done')

	        if len(frames) == 0:
	            return "❌ Error: no frames could be extracted from the video."

	        # Work on local lists so the previously published state stays
	        # consistent (VECTOR_DB, CAPTIONS and FRAMES all from the same video)
	        # while this run is in progress or if it fails part-way.
	        gr.Info("Generating captions...")
	        captions = [caption_image(frame) for frame in frames]
	        print('caption done')

	        gr.Info("Creating embeddings...")
	        embeddings = [embed_func(caption) for caption in captions]

	        gr.Info("Building vector store...")
	        vector_db = build_vector_store(embed=np.array(embeddings))
	        print('vector store done')

	        # Publish everything together only after every step succeeded.
	        caption_text[:] = captions
	        caption_embedding[:] = embeddings
	        VECTOR_DB = vector_db
	        # CAPTIONS is a separate list object from caption_text, so resetting
	        # the working list later can never empty the published captions.
	        CAPTIONS = captions
	        FRAMES = frames

	        return "✅ Processing complete. You can now enter a query."
	    except Exception as e:
	        # UI boundary: surface the failure as a status message.
	        return f"❌ Error: {str(e)}"


	def face_detect(video_file):
	    """Sample frames from an uploaded video and collect cropped faces.

	    Frames are obtained with ``extract_unique_frames(..., interval_sec=5)``
	    and each one is passed to ``face_crop``; the results are accumulated in
	    the module-level ``extracted_face`` list, which is cleared first.

	    Args:
	        video_file: Value of the video input; ``None`` if nothing was uploaded.

	    Returns:
	        A status message for the UI. Failures are reported in the message
	        rather than raised.
	    """
	    global face_frames, extracted_face
	    try:
	        if video_file is None:
	            return "❌ Please upload a video file."

	        extracted_face.clear()

	        gr.Info("Extracting frames...")
	        face_frames = extract_unique_frames(video_file, interval_sec=5)
	        print('extract_unique_frames done')
	        # Debug output only; guarded so an empty frame list does not abort
	        # the run with an IndexError.
	        if len(face_frames) > 0:
	            print(type(face_frames[0]))

	        for i, frame in enumerate(face_frames):
	            print('f frm:', i)
	            # face_crop returns a list of dicts per image; a failure on one
	            # frame is logged and skipped so the remaining frames still run.
	            try:
	                cropped_faces = face_crop(frame)
	            except Exception as crop_error:
	                print('face_crop failed on frame', i, ':', crop_error)
	                continue
	            extracted_face.extend(cropped_faces)
	            print('extracted_face: ', len(extracted_face))

	        print('extracted_face done')
	        return "✅ Face extraction done. Click 'Show Faces' to review."
	    except Exception as e:
	        # UI boundary: log and surface the failure as a status message.
	        print('error: ', e)
	        return f"❌ Error: {str(e)}"


	# Build the two-tab Gradio interface. Components are created in display
	# order inside their layout context managers, so statement order matters.
	with gr.Blocks() as demo:
	    gr.Markdown("# 🎥 Upload Your Video, CHAT_RAG")

	    with gr.Tabs():
	        # Tab 1: process a video, then query it.
	        with gr.TabItem("Video Upload & Query"):
	            video_input = gr.Video(label="Upload video file (MP4, AVI, etc.)")
	            process_button = gr.Button("Submit")
	            process_output = gr.Textbox(label="Status")

	            query_input = gr.Textbox(label="Enter a query")
	            query_button = gr.Button("Search")
	            query_caption = gr.Textbox(label="Matching Caption")
	            query_image = gr.Image(label="Matching Frame")

	            # process_youtube_link returns one status string; handle_query
	            # returns a (caption, frame) pair matching the two outputs.
	            process_button.click(fn=process_youtube_link, inputs=video_input, outputs=process_output)
	            query_button.click(fn=handle_query, inputs=query_input, outputs=[query_caption, query_image])



	        # Tab 2: extract faces from a video and let the user name them.
	        with gr.TabItem("Face Extractor"):
	            gr.Markdown("### 🧠 Upload a video, detect faces, assign names")

	            face_video_input = gr.Video(label="Upload video for face extraction")
	            face_process_button = gr.Button("Submit")
	            face_status = gr.Textbox(label="Status")

	            face_process_button.click(fn=face_detect, inputs=face_video_input, outputs=face_status)

	            show_faces_btn = gr.Button("Show Faces")

	            # Scrollable display (row of faces with textboxes)
	            # 20 image/textbox pairs are created hidden; prepare_faces_and_show
	            # returns updates for exactly 20 of each, so the counts must agree.
	            with gr.Row():
	                for i in range(20):
	                    with gr.Column(visible=True) as col:
	                        img_box = gr.Image(label=f"Face {i+1}", interactive=False, visible=False)
	                        txt_box = gr.Textbox(label="Enter Name", visible=False)
	                        face_image_boxes.append(img_box)
	                        face_name_inputs.append(txt_box)

	            save_names_btn = gr.Button("Save Names")

	            # Output order (status, all images, all textboxes) mirrors the
	            # list order returned by prepare_faces_and_show.
	            show_faces_btn.click(
	                fn=prepare_faces_and_show,
	                outputs=[face_status] + face_image_boxes + face_name_inputs
	            )

	            # Every name textbox is passed positionally to save_face_names(*names).
	            save_names_btn.click(
	                fn=save_face_names,
	                inputs=face_name_inputs,
	                outputs=face_status
	            )

	# Start the app as soon as this module is executed.
	demo.launch(debug = True)