Spaces:

yasserrmd
/

IntegrityChecker

Sleeping

yasserrmd committed on Nov 4, 2024

Commit

602cd0f

verified ·

1 Parent(s): addd1a8

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -22,11 +22,11 @@ CONFIG = synthid_mixin.DEFAULT_WATERMARKING_CONFIG
 # Function to check for AI-generated content using SynthID and highlight watermark
 @spaces.GPU
 def check_plagiarism(text):
     # Logits processor for SynthID
     logits_processor = logits_processing.SynthIDLogitsProcessor(
         **CONFIG, top_k=40, temperature=0.5
     )
     # Tokenize and process the input text
     inputs = tokenizer(text, return_tensors="pt").to(DEVICE)
@@ -49,9 +49,10 @@ def check_plagiarism(text):
         token_scores = outputs.scores
         # Loop through each generated token and its corresponding score
-        for token, score in zip(generated_tokens, token_scores):
-            processed_score = logits_processor(score)
-            token_text = tokenizer.decode(token)
             # If processed score indicates watermark, highlight this token
             if processed_score.mean().item() > 0.5:

 # Function to check for AI-generated content using SynthID and highlight watermark
 @spaces.GPU
 def check_plagiarism(text):
     # Logits processor for SynthID
     logits_processor = logits_processing.SynthIDLogitsProcessor(
         **CONFIG, top_k=40, temperature=0.5
     )
     # Tokenize and process the input text
     inputs = tokenizer(text, return_tensors="pt").to(DEVICE)
         token_scores = outputs.scores
         # Loop through each generated token and its corresponding score
+        for token_id, score in zip(generated_tokens, token_scores):
+            # Apply SynthIDLogitsProcessor to each score by calling it with 'scores=score'
+            processed_score = logits_processor(scores=score)
+            token_text = tokenizer.decode(token_id.unsqueeze(0))  # Decode token_id for individual token text
             # If processed score indicates watermark, highlight this token
             if processed_score.mean().item() > 0.5: