Spaces:

ranamhamoud
/

Authenticity

Sleeping

Authenticity / text_analyzer.py

Ranam Hamoud

Update files and add .gitignore, remove pycache from tracking

0b42831 25 days ago

4.84 kB

	import warnings
	warnings.filterwarnings("ignore")

	# try to import the desklib AI detector
	try:
	from plagiarism_detection import ai_plagiarism_detection
	DESKLIB_AVAILABLE = True
	except ImportError:
	DESKLIB_AVAILABLE = False
	print("Warning: plagiarism_detection module not found. Using fallback AI detection.")


	# class for detecting AI-generated text
	class AITextDetector:
	def __init__(self, device=None, threshold=0.78):
	self.threshold = threshold

	# check if desklib model is available
	if not DESKLIB_AVAILABLE:
	print("Warning: plagiarism_detection module not found. AI detection will not be available.")
	print("Ensure plagiarism_detection.py is in the same directory.")
	self.available = False
	else:
	print(f"Using Desklib AI text detector (threshold: {self.threshold})")
	self.available = True

	# main detection function
	def detect_ai_text(self, text):

	# return neutral result if detector not available
	if not self.available:
	return {
	'ai_generated': False,
	'confidence': 0.5,
	'indicators': [],
	'interpretation': "AI detection not available. Install plagiarism_detection module.",
	'model_used': 'N/A (module not found)'
	}

	# run detection using desklib model
	try:
	probability, ai_detected = ai_plagiarism_detection(
	text,
	threshold=self.threshold,
	show_results=False
	)

	return {
	'ai_generated': ai_detected,
	'confidence': float(probability),
	'indicators': self._identify_ai_indicators(probability),
	'interpretation': self._interpret_ai_detection(probability),
	'model_used': 'Desklib AI Detector v1.01'
	}
	except Exception as e:
	print(f"Something went wrong with AI detection: {e}")
	return {
	'ai_generated': False,
	'confidence': 0.5,
	'indicators': [],
	'interpretation': "Could not run AI detection",
	'model_used': 'Error'
	}

	# identify specific indicators based on probability
	def _identify_ai_indicators(self, probability):
	indicators = []

	if probability > 0.9:
	indicators.append("Very high AI probability (>90%)")
	elif probability > 0.7:
	indicators.append("High AI probability (70-90%)")
	elif probability > self.threshold:
	indicators.append(f"AI detected above threshold ({self.threshold*100:.0f}%)")

	return indicators

	# generate interpretation text
	def _interpret_ai_detection(self, score):
	interpretation = f"AI-Generated Text Detection:\n\n"
	interpretation += f"- AI Probability Score: {score*100:.1f}%\n"
	interpretation += f"- Detection Threshold: {self.threshold*100:.0f}%\n"

	return interpretation


	# main analyzer class that combines all text analysis
	class TextAuthenticityAnalyzer:

	def __init__(self, device=None, ai_threshold=0.78):
	# initialize AI detector
	self.ai_detector = AITextDetector(device=device, threshold=ai_threshold)

	# analyze text for authenticity
	def analyze(self, text):
	# run AI detection
	ai_results = self.ai_detector.detect_ai_text(text)

	# calculate authenticity score (inverse of AI probability)
	ai_penalty = ai_results['confidence']
	authenticity_score = 1.0 - ai_penalty

	# determine risk level based on authenticity
	if authenticity_score < 0.3:
	overall_assessment = "HIGH RISK: Strong AI-generated text indicators"
	risk_level = "high"
	elif authenticity_score < 0.5:
	overall_assessment = "MODERATE RISK: Likely AI-generated"
	risk_level = "moderate"
	elif authenticity_score < 0.7:
	overall_assessment = "LOW RISK: Some AI characteristics"
	risk_level = "low"
	else:
	overall_assessment = "AUTHENTIC: Text appears human-written"
	risk_level = "minimal"

	return {
	'authenticity_score': float(authenticity_score),
	'risk_level': risk_level,
	'overall_assessment': overall_assessment,
	'ai_detection': ai_results,
	}


	# test code - runs when script is executed directly
	if __name__ == "__main__":
	analyzer = TextAuthenticityAnalyzer()
	print("Text authenticity analyzer initialized.")
	print("Components: Plagiarism Detector + AI Text Detector")