Spaces:

rairo
/

recruitment-api

Sleeping

App Files Files Community

recruitment-api / main.py

rairo

Update main.py

447acee verified 4 months ago

raw

history blame contribute delete

6.76 kB

	from flask import Flask, request, jsonify
	import re
	import os
	import json
	import tempfile
	import logging
	import google.generativeai as genai
	import pypdf
	from flask_cors import CORS

	# Setup logging
	logging.basicConfig(level=logging.INFO)

	app = Flask(__name__)
	CORS(app) # Enable CORS for all routes

	# Get API key securely
	api_key = os.getenv('Gemini')
	if not api_key:
	raise ValueError("Gemini API key not found in environment variables")

	def configure_gemini(api_key):
	"""Configure Gemini AI model."""
	try:
	genai.configure(api_key=api_key)
	return genai.GenerativeModel('gemini-2.0-flash-exp')
	except Exception as e:
	logging.error(f"Error configuring Gemini: {str(e)}")
	raise

	def read_pdf(file_path):
	"""Extract text from a PDF file."""
	try:
	text_content = []
	with open(file_path, 'rb') as file:
	pdf_reader = pypdf.PdfReader(file)
	for page in pdf_reader.pages:
	text = page.extract_text()
	if text:
	text_content.append(text)
	return "\n".join(text_content)
	except Exception as e:
	logging.error(f"Error reading PDF: {str(e)}")
	raise

	def extract_json_from_response(response_text):
	"""Extract valid JSON from Gemini's response."""
	try:
	json_match = re.search(r'\{.*\}', response_text, re.DOTALL)
	if not json_match:
	raise ValueError("No valid JSON found in response")

	json_str = json_match.group(0).replace('```json', '').replace('```', '').strip()
	return json.loads(json_str)
	except json.JSONDecodeError as e:
	logging.error(f"Error parsing JSON: {str(e)}")
	raise
	except Exception as e:
	logging.error(f"Unexpected error extracting JSON: {str(e)}")
	raise

	def process_with_gemini(model, prompt, text, answers_text=None):
	"""Send combined text (job description and applicant documents) to Gemini and return structured JSON response."""

	# Build the applicant section with answers if provided
	applicant_section = f"Applicant Documents:\n{text}"
	if answers_text:
	applicant_section += f"\n\nApplicant's Answers to Screening Questions:\n{answers_text}"

	full_prompt = f"""
	You are an expert HR recruiter. Based on the job description and the applicant's documents provided below, assess the applicant's suitability for the job.

	Job Description:
	{prompt}

	{applicant_section}

	Provide a detailed analysis that includes:
	- A score out of 100 evaluating the applicant's fit for the role.
	- A recommendation for hiring: either "hire" or "do not hire".
	- A clear justification for the decision.

	Return ONLY valid JSON with this exact structure:
	{{
	"score": <number>,
	"recommendation": "<hire/do not hire>",
	"justification": "<string>"
	}}
	"""
	try:
	response = model.generate_content([full_prompt])
	return extract_json_from_response(response.text)
	except Exception as e:
	logging.error(f"Error processing text with Gemini: {str(e)}")
	raise

	@app.route('/process-application', methods=['POST'])
	def process_application():
	"""
	Handle applicant documents and job details.
	Expects:
	- job_id: form data string
	- job_description: form data string
	- applicant_id: form data string
	- questions_answers: (optional) form data string - JSON string containing Q&A pairs
	- files: one or more PDF files (e.g., CV, cover letter)
	Returns a JSON response with score, recommendation, and justification.
	"""
	try:
	# Get job-related details from the form data
	job_id = request.form.get('job_id')
	job_description = request.form.get('job_description')
	applicant_id = request.form.get('applicant_id')
	questions_answers = request.form.get('questions_answers') # New field for Q&A

	if not job_id or not job_description or not applicant_id:
	return jsonify({'error': 'job_id, job_description, and applicant_id are required'}), 400

	# Ensure at least one file is uploaded
	if 'files' not in request.files:
	return jsonify({'error': 'No files uploaded'}), 400

	files = request.files.getlist('files')
	if len(files) == 0:
	return jsonify({'error': 'No files provided'}), 400

	combined_text = ""
	temp_files = []

	# Process each uploaded PDF file
	for file in files:
	if file.filename == '':
	continue
	if not file.filename.endswith('.pdf'):
	return jsonify({'error': f'File {file.filename} must be a PDF'}), 400
	# Save file to a temporary location
	temp_file = tempfile.NamedTemporaryFile(delete=False, suffix=".pdf")
	file.save(temp_file.name)
	temp_files.append(temp_file.name)
	# Extract text and combine
	combined_text += read_pdf(temp_file.name) + "\n\n"

	# Parse and format questions_answers if provided
	answers_text = None
	if questions_answers:
	try:
	qa_data = json.loads(questions_answers)
	# Format the Q&A data for better readability
	formatted_answers = []
	if isinstance(qa_data, list):
	for idx, qa in enumerate(qa_data, 1):
	question = qa.get('question', 'N/A')
	response = qa.get('response', 'N/A')
	formatted_answers.append(f"Q{idx}: {question}\nA{idx}: {response}")
	else:
	formatted_answers.append(str(qa_data))
	answers_text = "\n\n".join(formatted_answers)
	except json.JSONDecodeError:
	logging.warning("questions_answers is not valid JSON, treating as plain text")
	answers_text = questions_answers

	# Configure Gemini and process combined text
	model = configure_gemini(api_key)
	extracted_data = process_with_gemini(model, job_description, combined_text, answers_text)

	# Clean up temporary files
	for temp_file in temp_files:
	os.remove(temp_file)

	# Log the processing
	logging.info(f"Processed application for applicant_id: {applicant_id} for job_id: {job_id}")

	return jsonify(extracted_data)

	except ValueError as ve:
	logging.warning(f"Client error: {str(ve)}")
	return jsonify({'error': str(ve)}), 400
	except Exception as e:
	logging.error(f"Internal server error: {str(e)}")
	return jsonify({'error': 'Internal server error'}), 500

	if __name__ == '__main__':
	app.run(debug=True, host="0.0.0.0", port=7860)