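"""Gradio entry point for the PICOS Literature Analysis System.

Wires together citation-file parsing, deduplication, multi-model PICOS
analysis, and result merging behind a web interface.
"""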
import os
from dotenv import load_dotenv
import time
import logging
from datetime import datetime
import gradio as gr
from file_processor import FileProcessor
from analyzer import PICOSAnalyzer
from deduplicator import Deduplicator
from result_processor import ResultProcessor
# Configuration of directories
BASE_DIR = os.path.dirname(os.path.abspath(__file__))
DATA_DIR = os.path.join(BASE_DIR, "data")
LOG_DIR = os.path.join(BASE_DIR, "logs")
# Load .env file if it exists
dotenv_path = os.path.join(BASE_DIR, '.env')
if os.path.exists(dotenv_path):
load_dotenv(dotenv_path)
else:
print("Warning: .env file not found.")
# Initialize components for analysis, file processing, deduplication, and result processing
analyzer = PICOSAnalyzer()
file_processor = FileProcessor(DATA_DIR)
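# Shared cache of per-model result DataFrames; Models B and C read their
# upstream models' results from here.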
model_results = {}
deduplicator = Deduplicator()
result_processor = ResultProcessor()
# Ensure required directories exist
for directory in [DATA_DIR, LOG_DIR]:
try:
os.makedirs(directory, exist_ok=True)
except Exception as e:
raise RuntimeError(f"Failed to create directory {directory}: {str(e)}")
# Configure logging: log to both a file and the console
try:
log_file = os.path.join(LOG_DIR, f"picos_analysis_{datetime.now().strftime('%Y%m%d_%H%M%S')}.log")
# File handler for logging to a file
file_handler = logging.FileHandler(log_file, encoding='utf-8')
file_handler.setLevel(logging.INFO)
# Console handler for logging to the terminal
console_handler = logging.StreamHandler()
console_handler.setLevel(logging.INFO)
# Formatter for log messages
formatter = logging.Formatter('%(asctime)s - %(levelname)s - %(message)s')
file_handler.setFormatter(formatter)
console_handler.setFormatter(formatter)
# Configure the root logger
root_logger = logging.getLogger()
root_logger.setLevel(logging.INFO)
root_logger.addHandler(file_handler)
root_logger.addHandler(console_handler)
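    # With this formatter, entries look like:
    # 2025-01-01 12:00:00,000 - INFO - Starting MODEL_A analysis...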
except Exception as e:
print(f"Failed to initialize logging: {str(e)}")
raise
def create_gradio_interface():
"""Create and return the Gradio interface for the PICOS Analysis System."""
    def parse_nbib(file) -> tuple:
        """
        Parse a citation export file: .nbib (PubMed) or .ris (Embase or
        Web of Science, detected from the file content).
        Returns a tuple containing the Excel output path and a preview text.
        """
try:
if not file:
return None, "No file uploaded"
# Determine file type based on extension
file_extension = os.path.splitext(file.name)[1].lower()
if file_extension == '.nbib':
output_path, preview = file_processor.parse_nbib(file.name)
elif file_extension == '.ris':
# Read file content to determine RIS format (Embase or Web of Science)
with open(file.name, 'r', encoding='utf-8') as f:
content = f.read()
if 'T1 - ' in content: # Embase RIS format
output_path, preview = file_processor.parse_embase_ris(file.name)
else: # Assume Web of Science RIS format
output_path, preview = file_processor.parse_wos_ris(file.name)
else:
return None, "Unsupported file format. Please upload a .nbib or .ris file"
if not output_path:
return None, "Failed to parse file"
return output_path, preview
except Exception as e:
error_msg = f"Error parsing file: {str(e)}"
logging.error(error_msg)
return None, error_msg
def parse_scopus(file) -> tuple:
"""
Parse a Scopus RIS file.
Returns a tuple containing the Excel output path and a preview text.
"""
try:
if not file:
return None, "No file uploaded"
output_path, preview = file_processor.parse_scopus_ris(file.name)
if not output_path:
return None, "Failed to parse file"
return output_path, preview
except Exception as e:
error_msg = f"Error parsing Scopus file: {str(e)}"
logging.error(error_msg)
return None, error_msg
def update_picos_criteria(p, i, c, o, s):
"""Update the PICOS criteria used for analysis."""
try:
analyzer.update_picos_criteria({
"population": p.strip(),
"intervention": i.strip(),
"comparison": c.strip(),
"outcome": o.strip(),
"study_design": s.strip()
})
return "βœ“ PICOS criteria updated successfully"
except Exception as e:
return f"❌ Error updating PICOS criteria: {str(e)}"
def update_model_settings(model_key, api_url, api_key, model_name, temperature, max_tokens, batch_size, threads, prompt, is_inference, timeout):
"""Update the settings for a specified model."""
try:
analyzer.update_model_config(model_key, {
"api_url": api_url.strip(),
"api_key": api_key.strip(),
"model": model_name.strip(),
"temperature": float(temperature),
"max_tokens": int(max_tokens),
"batch_size": int(batch_size),
"threads": int(threads),
"is_inference": bool(is_inference),
"timeout": float(timeout),
"updated": True # mark as manually updated
})
analyzer.update_prompt(model_key, prompt.strip())
return "βœ“ Settings updated successfully"
except Exception as e:
return f"❌ Error updating settings: {str(e)}"
def test_connection(model_key):
"""Test the API connection for a specified model."""
try:
result = analyzer.test_api_connection(model_key)
return result
except Exception as e:
return f"❌ Error testing connection: {str(e)}"
def process_model(input_file, model_key, model_a_input=None, model_b_input=None):
"""
Process analysis for a single model and return the results.
For Model B and C, the required previous results files must be provided.
"""
try:
logging.info(f"Loading input file for {model_key.upper()}...")
df = file_processor.load_excel(input_file.name)
if df is None:
return None, "Failed to load Excel file"
# For Model B, require Model A results; for Model C, require both Model A and B results
if model_key == "model_b":
if model_a_input is None or not os.path.exists(model_a_input.name):
return None, "Model A results file required for MODEL_B"
model_results["model_a"] = file_processor.load_excel(model_a_input.name)
elif model_key == "model_c":
logging.info("Loading Model A and B results for Model C analysis...")
if model_a_input is None or not os.path.exists(model_a_input.name) or \
model_b_input is None or not os.path.exists(model_b_input.name):
return None, "Both Model A and B results files required for MODEL_C"
model_results["model_a"] = file_processor.load_excel(model_a_input.name)
model_results["model_b"] = file_processor.load_excel(model_b_input.name)
# Process the model
logging.info(f"Starting {model_key.upper()} analysis...")
total_rows = len(df)
processed_rows = 0
errors = 0
empty_abstracts = 0
start_time = time.time()
            def progress_callback(row_index, error=False, is_empty=False):
                nonlocal processed_rows, errors, empty_abstracts
                # Count each row in exactly one category: empty abstract,
                # error, or successfully processed
                if is_empty:
                    empty_abstracts += 1
                elif error:
                    errors += 1
                else:
                    processed_rows += 1
                # Calculate progress and time estimates
                elapsed_time = time.time() - start_time
                progress = processed_rows / total_rows
                if progress > 0:
                    # Estimate remaining time from the overall average time per item
                    avg_time_per_item = elapsed_time / (processed_rows + errors + empty_abstracts)
                    remaining_items = total_rows - (processed_rows + errors + empty_abstracts)
                    remaining_time = avg_time_per_item * remaining_items
# Use the batch size of the model to control the log output frequency
batch_size = analyzer.model_manager.get_config(model_key)["batch_size"]
if (processed_rows + errors + empty_abstracts) % batch_size == 0:
logging.info(f"{model_key.upper()} Progress: {processed_rows + errors + empty_abstracts}/{total_rows} rows "
f"({(processed_rows + errors + empty_abstracts) / total_rows:.1%}) - "
f"Processed: {processed_rows}, Errors: {errors}, Empty: {empty_abstracts} - "
f"Elapsed: {elapsed_time:.1f}s, Remaining: {remaining_time:.1f}s")
results_df = analyzer.process_batch(df, model_key, model_results, progress_callback)
if results_df is None:
return None, f"{model_key.upper()} failed to process results"
# Save results immediately with fixed path in DATA_DIR
output_file = os.path.join(DATA_DIR, f"{model_key}_results.xlsx")
if model_key == "model_c":
# For Model C, merge all results before saving
merged_df = analyzer.merge_results(df, {
"model_a": model_results["model_a"],
"model_b": model_results["model_b"],
"model_c": results_df
})
if not file_processor.save_excel(merged_df, output_file):
return None, f"Failed to save {model_key.upper()} results"
else:
# For Model A and B, save individual results
if not file_processor.save_excel(results_df, output_file):
return None, f"Failed to save {model_key.upper()} results"
total_time = time.time() - start_time
completion_msg = (f"{model_key.upper()} analysis completed in {total_time:.1f}s - "
f"Processed {processed_rows} rows with {errors} errors")
logging.info(completion_msg)
# Return the full path to the saved file with gr.update
if os.path.exists(output_file):
return gr.update(value=output_file), completion_msg
else:
return None, f"Failed to verify {model_key.upper()} results file"
except Exception as e:
error_msg = f"Error in {model_key.upper()} analysis: {str(e)}"
logging.error(error_msg)
return None, error_msg
def merge_results_with_files(input_file, model_a_file, model_b_file, model_c_file):
"""
Merge all model results from the provided files and export the merged results as an Excel file.
"""
if not all([input_file, model_a_file, model_b_file]):
return None, "Original file, Model A and B results are required"
try:
df = file_processor.load_excel(input_file.name)
model_a_results = file_processor.load_excel(model_a_file.name)
model_b_results = file_processor.load_excel(model_b_file.name)
model_c_results = file_processor.load_excel(model_c_file.name) if model_c_file else None
if any(result is None for result in [df, model_a_results, model_b_results]):
return None, "Failed to load one or more required files"
model_results["model_a"] = model_a_results
model_results["model_b"] = model_b_results
if model_c_results is not None:
model_results["model_c"] = model_c_results
merged_df = analyzer.merge_results(df, model_results)
final_filename = os.path.join(DATA_DIR, "final_results.xlsx")
result_processor.export_to_excel(merged_df, final_filename)
return final_filename, "Results merged successfully"
except Exception as e:
return None, f"Error merging results: {str(e)}"
def run_all_models(input_file):
"""Run analysis pipeline for all models with streaming updates"""
try:
# Read Excel file using file processor
df = file_processor.load_excel(input_file.name)
if df is None:
yield [None, None, None, None, "Failed to load input file"]
return
# --- Process Model A ---
logging.info("Starting Model A analysis...")
model_a_results = analyzer.process_batch(df, "model_a")
if model_a_results is None:
yield [None, None, None, None, "Model A failed to process results"]
return
# Save Model A results with fixed path
model_a_path = os.path.join(DATA_DIR, "model_a_results.xlsx")
if not file_processor.save_excel(model_a_results, model_a_path):
yield [None, None, None, None, "Failed to save Model A results"]
return
model_results["model_a"] = model_a_results
status_msg = "Model A completed successfully"
# Yield update: Model A result available
yield [gr.update(value=model_a_path), None, None, None, status_msg]
# --- Process Model B ---
logging.info("Starting Model B analysis...")
model_b_results = analyzer.process_batch(df, "model_b", {"model_a": model_a_results})
if model_b_results is None:
yield [gr.update(value=model_a_path), None, None, None, "Model B failed to process results"]
return
# Save Model B results with fixed path
model_b_path = os.path.join(DATA_DIR, "model_b_results.xlsx")
if not file_processor.save_excel(model_b_results, model_b_path):
yield [gr.update(value=model_a_path), None, None, None, "Failed to save Model B results"]
return
model_results["model_b"] = model_b_results
status_msg = "Model B completed successfully"
# Yield update: Both Model A and B results available
yield [gr.update(value=model_a_path), gr.update(value=model_b_path), None, None, status_msg]
# --- Process Model C ---
logging.info("Starting Model C analysis...")
model_c_results = analyzer.process_batch(df, "model_c", {
"model_a": model_a_results,
"model_b": model_b_results
})
model_c_path = None
if model_c_results is not None:
# Save Model C results with fixed path
model_c_path = os.path.join(DATA_DIR, "model_c_results.xlsx")
if not file_processor.save_excel(model_c_results, model_c_path):
yield [gr.update(value=model_a_path), gr.update(value=model_b_path), None, None, "Failed to save Model C results"]
return
model_results["model_c"] = model_c_results
status_msg = "Model C completed successfully"
# Yield update: Model A, B and C results available
yield [gr.update(value=model_a_path), gr.update(value=model_b_path), gr.update(value=model_c_path), None, status_msg]
# Merge results
logging.info("Merging results...")
merged_df = analyzer.merge_results(df, model_results)
# Save final results with fixed path
final_path = os.path.join(DATA_DIR, "final_results.xlsx")
if not file_processor.save_excel(merged_df, final_path):
yield [gr.update(value=model_a_path), gr.update(value=model_b_path), gr.update(value=model_c_path), None, "Failed to save final results"]
return
completion_msg = "All models completed successfully"
# Yield final update with all results available
yield [gr.update(value=model_a_path), gr.update(value=model_b_path), gr.update(value=model_c_path), gr.update(value=final_path), completion_msg]
except Exception as e:
error_msg = f"Error in pipeline: {str(e)}"
logging.error(error_msg)
yield [None, None, None, None, error_msg]
def process_deduplication(files, threshold):
"""
Process deduplication for multiple Excel files.
The function identifies duplicate entries based on a similarity threshold.
"""
try:
if not files:
return None, None, "No files uploaded"
dataframes = []
for file in files:
if not file:
continue
df = file_processor.load_excel(file.name)
if df is None:
return None, None, f"Failed to load file: {file.name}"
dataframes.append(df)
if not dataframes:
return None, None, "No valid files to process"
unique_df, clusters_df = deduplicator.process_dataframes(dataframes, threshold)
unique_path = file_processor.save_excel(unique_df, "deduplicated_data.xlsx")
clusters_path = file_processor.save_excel(clusters_df, "duplicate_clusters.xlsx")
if not unique_path or not clusters_path:
return None, None, "Failed to save results"
status_msg = f"Deduplication completed successfully:\n"
status_msg += f"Original entries: {sum(len(df) for df in dataframes)}\n"
status_msg += f"Unique entries: {len(unique_df)}\n"
status_msg += f"Duplicate clusters: {len(clusters_df['Cluster_ID'].unique()) if len(clusters_df) > 0 else 0}"
return unique_path, clusters_path, status_msg
except Exception as e:
error_msg = f"Error in deduplication: {str(e)}"
logging.error(error_msg)
return None, None, error_msg
# Build the Gradio interface
interface = gr.Blocks(title="PICOS Analysis System")
with interface:
gr.Markdown("""
<div style="text-align: center;">
<h1>PICOS Literature Analysis System</h1>
<p>This system uses a multi-model approach to analyze medical literature abstracts.</p>
</div>
""")
with gr.Tab("Instructions"):
gr.Markdown("""
## System Overview
This system helps researchers analyze medical literature by providing tools for citation management,
deduplication, and automated PICOS analysis using multiple language models.
## Workflow Steps
**Citation Processing** -> **Deduplication** (Optional) -> **PICOS Analysis Setup** -> **Analysis Execution**
## File Format Requirements
### Input Files
            - **PubMed**: NBIB format (.nbib)
- **Embase**: RIS format (.ris)
- **Web of Science**: RIS format (.ris)
- **Scopus**: RIS format (.ris)
### Processed Format
The system will generate standardized Excel files (XLSX format) with these columns:
- **Index**: Unique identifier for each abstract
- **Title**: Article title
- **Authors**: Author list (semicolon-separated)
- **Abstract**: Full abstract text
- **DOI**: Digital Object Identifier (when available)
### Analysis Results
Each model will generate an Excel file containing:
- All original citation data
- PICOS analysis results
- Inclusion/exclusion decisions
- Reasoning for decisions
""")
with gr.Tab("Citation File Processing"):
with gr.Tab("Pubmed"):
gr.Markdown("""
## Pubmed NBIB Processing
Upload a .nbib file from Pubmed to extract and convert it to Excel format. The extracted data will include:
- DOI
- Title
- Authors
- Abstract
""")
with gr.Row():
nbib_file = gr.File(label="Upload NBIB File", file_types=[".nbib"])
process_nbib_btn = gr.Button("Process NBIB File")
with gr.Row():
nbib_preview = gr.Textbox(label="Preview", lines=20)
nbib_output = gr.File(label="Download Excel")
process_nbib_btn.click(
parse_nbib,
inputs=[nbib_file],
outputs=[nbib_output, nbib_preview]
)
with gr.Tab("Embase"):
gr.Markdown("""
## Embase RIS Processing
Upload a .ris file from Embase to extract and convert it to Excel format. The extracted data will include:
- DOI
- Title
- Authors
- Abstract
""")
with gr.Row():
embase_file = gr.File(label="Upload Embase RIS File", file_types=[".ris"])
process_embase_btn = gr.Button("Process Embase RIS File")
with gr.Row():
embase_preview = gr.Textbox(label="Preview", lines=20)
embase_output = gr.File(label="Download Excel")
process_embase_btn.click(
parse_nbib,
inputs=[embase_file],
outputs=[embase_output, embase_preview]
)
with gr.Tab("Web of Science"):
gr.Markdown("""
## Web of Science RIS Processing
Upload a .ris file from Web of Science to extract and convert it to Excel format. The extracted data will include:
- DOI
- Title
- Authors
- Abstract
""")
with gr.Row():
wos_file = gr.File(label="Upload WOS RIS File", file_types=[".ris"])
process_wos_btn = gr.Button("Process WOS RIS File")
with gr.Row():
wos_preview = gr.Textbox(label="Preview", lines=20)
wos_output = gr.File(label="Download Excel")
                process_wos_btn.click(
                    parse_nbib,
inputs=[wos_file],
outputs=[wos_output, wos_preview]
)
with gr.Tab("Scopus"):
gr.Markdown("""
## Scopus RIS Processing
Upload a .ris file from Scopus to extract and convert it to Excel format. The extracted data will include:
- DOI
- Title
- Authors
- Abstract
""")
with gr.Row():
scopus_file = gr.File(label="Upload Scopus RIS File", file_types=[".ris"])
process_scopus_btn = gr.Button("Process Scopus RIS File")
with gr.Row():
scopus_preview = gr.Textbox(label="Preview", lines=20)
scopus_output = gr.File(label="Download Excel")
process_scopus_btn.click(
parse_scopus,
inputs=[scopus_file],
outputs=[scopus_output, scopus_preview]
)
with gr.Tab("Deduplication"):
gr.Markdown("""
## Citation Deduplication
Upload multiple Excel files to remove duplicate entries across different citation sources.
The system will identify similar entries based on title and author information.
### Features:
- Support for multiple Excel files
- Adjustable similarity threshold
- Detailed duplicate clusters report
- Standardized output format
""")
with gr.Row():
input_files = gr.File(
label="Upload Excel Files",
file_types=[".xlsx", ".xls"],
file_count="multiple"
)
threshold = gr.Slider(
label="Similarity Threshold",
minimum=0.1,
maximum=1.0,
value=0.8,
step=0.05,
info="Higher values mean stricter matching (0.8 recommended)"
)
with gr.Row():
process_btn = gr.Button("Process Deduplication")
with gr.Row():
status = gr.Textbox(label="Status", lines=5)
with gr.Row():
unique_output = gr.File(label="Download Deduplicated Data")
clusters_output = gr.File(label="Download Duplicate Clusters")
process_btn.click(
process_deduplication,
inputs=[input_files, threshold],
outputs=[unique_output, clusters_output, status]
)
with gr.Tab("LLM Analysis"):
with gr.Tab("PICOS Criteria"):
gr.Markdown("""
## PICOS Criteria Settings
Define the standard PICOS criteria that will be used by all models.
These criteria will be used to evaluate whether each article meets the requirements.
""")
with gr.Group("Standard PICOS Criteria"):
population = gr.Textbox(label="Population", value=analyzer.picos_criteria["population"],
placeholder="e.g., patients with hepatocellular carcinoma")
intervention = gr.Textbox(label="Intervention", value=analyzer.picos_criteria["intervention"],
placeholder="e.g., immunotherapy or targeted therapy")
comparison = gr.Textbox(label="Comparison", value=analyzer.picos_criteria["comparison"],
placeholder="e.g., standard therapy or placebo")
outcome = gr.Textbox(label="Outcome", value=analyzer.picos_criteria["outcome"],
placeholder="e.g., survival or response rate")
study_design = gr.Textbox(label="Study Design", value=analyzer.picos_criteria["study_design"],
placeholder="e.g., randomized controlled trial")
update_picos_btn = gr.Button("Update PICOS Criteria")
picos_status = gr.Textbox(label="Status")
update_picos_btn.click(
update_picos_criteria,
inputs=[population, intervention, comparison, outcome, study_design],
outputs=picos_status
)
with gr.Tab("Model Settings"):
for model_key in ["model_a", "model_b", "model_c"]:
with gr.Group(f"{model_key.upper()} Settings"):
config = analyzer.model_manager.get_config(model_key)
api_url = gr.Textbox(label="API URL", value=config["api_url"])
api_key = gr.Textbox(label="API Key", value=config["api_key"])
model_name = gr.Textbox(label="Model", value=config["model"])
is_inference = gr.Checkbox(
label="Inference Model",
value=config.get("is_inference", False),
info="Enable inference compatibility mode for models that return reasoning process"
)
temperature = gr.Slider(label="Temperature", minimum=0, maximum=10, value=config["temperature"])
max_tokens = gr.Number(label="Max Tokens", value=config["max_tokens"])
batch_size = gr.Number(label="Batch Size", value=config["batch_size"])
threads = gr.Slider(label="Threads", minimum=1, maximum=32, step=1, value=config["threads"])
timeout = gr.Number(label="Timeout (seconds)", value=config.get("timeout", 180))
prompt = gr.Textbox(label="Prompt Template", value=analyzer.prompt_manager.get_prompt(model_key), lines=10)
update_btn = gr.Button(f"Update {model_key.upper().replace('_', ' ')} Settings")
test_btn = gr.Button(f"Test {model_key.upper().replace('_', ' ')} Connection")
status = gr.Textbox(label="Status", lines=10)
update_btn.click(
update_model_settings,
inputs=[gr.Textbox(value=model_key, visible=False),
api_url,
api_key,
model_name,
temperature,
max_tokens,
batch_size,
threads,
prompt,
is_inference,
timeout],
outputs=status
)
test_btn.click(
test_connection,
inputs=[gr.Textbox(value=model_key, visible=False)],
outputs=status
)
with gr.Tab("Analysis"):
with gr.Row():
input_file = gr.File(label="Original Excel File")
model_a_input = gr.File(label="Model A Results")
model_b_input = gr.File(label="Model B Results")
model_c_input = gr.File(label="Model C Results")
with gr.Row():
model_a_btn = gr.Button("Run Model A")
model_b_btn = gr.Button("Run Model B")
model_c_btn = gr.Button("Run Model C")
merge_btn = gr.Button("Merge Results")
                # run_all_models is a generator, so its click handler streams intermediate updates
run_all_btn = gr.Button("Run All", variant="primary")
status = gr.Textbox(label="Status")
with gr.Row():
model_a_output = gr.File(label="Model A Results", interactive=True)
model_b_output = gr.File(label="Model B Results", interactive=True)
model_c_output = gr.File(label="Model C Results", interactive=True)
final_output = gr.File(label="Final Results", interactive=True)
# Individual model runs
model_a_btn.click(
lambda x: process_model(x, "model_a"),
inputs=[input_file],
outputs=[model_a_output, status]
)
model_b_btn.click(
lambda x, y: process_model(x, "model_b", y),
inputs=[input_file, model_a_input],
outputs=[model_b_output, status]
)
model_c_btn.click(
lambda x, y, z: process_model(x, "model_c", y, z),
inputs=[input_file, model_a_input, model_b_input],
outputs=[model_c_output, status]
)
merge_btn.click(
merge_results_with_files,
inputs=[input_file, model_a_input, model_b_input, model_c_input],
outputs=[final_output, status]
)
run_all_btn.click(
fn=run_all_models,
inputs=[input_file],
outputs=[model_a_output, model_b_output, model_c_output, final_output, status]
)
return interface
if __name__ == "__main__":
interface = create_gradio_interface()
if interface:
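        # server_name="0.0.0.0" exposes the app on all network interfaces;
        # omit it to serve on localhost only.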
interface.launch(server_name="0.0.0.0", server_port=7860, pwa=True)
else:
print("Error: Failed to create Gradio interface")