EbadDev92t225 committed on
Commit
1ac38f8
·
verified ·
1 Parent(s): 32f259a

Make model less aggressive: raise the FLAG-to-DELETE escalation thresholds (toxic_score 0.80 → 0.95, hate_score 0.70 → 0.90)

Browse files
Files changed (1) hide show
  1. moderator.py +1 -1
moderator.py CHANGED
@@ -242,7 +242,7 @@ class SimpleModerator:
242
  final_confidence = hate_score
243
 
244
  # If both pattern and model agree on FLAG, escalate to DELETE
245
- if pattern_decision == "FLAG" and (toxic_score > 0.80 or hate_score > 0.70):
246
  action = "delete"
247
  reason = f"Pattern + Model agreement: {reason}"
248
  final_confidence = max(pattern_confidence, toxic_score, hate_score)
 
242
  final_confidence = hate_score
243
 
244
  # If both pattern and model agree on FLAG, escalate to DELETE
245
+ if pattern_decision == "FLAG" and (toxic_score > 0.95 or hate_score > 0.90):
246
  action = "delete"
247
  reason = f"Pattern + Model agreement: {reason}"
248
  final_confidence = max(pattern_confidence, toxic_score, hate_score)