Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -6,6 +6,7 @@ import subprocess
|
|
| 6 |
import nltk
|
| 7 |
from nltk.corpus import wordnet
|
| 8 |
from gensim import downloader as api
|
|
|
|
| 9 |
|
| 10 |
# Ensure necessary NLTK data is downloaded
|
| 11 |
nltk.download('wordnet')
|
|
@@ -28,6 +29,12 @@ device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
|
| 28 |
tokenizer = AutoTokenizer.from_pretrained("distilbert-base-uncased-finetuned-sst-2-english")
|
| 29 |
model = AutoModelForSequenceClassification.from_pretrained("distilbert-base-uncased-finetuned-sst-2-english").to(device)
|
| 30 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 31 |
# AI detection function using DistilBERT
|
| 32 |
def detect_ai_generated(text):
|
| 33 |
inputs = tokenizer(text, return_tensors="pt", truncation=True, max_length=512).to(device)
|
|
@@ -45,7 +52,7 @@ def get_synonyms_nltk(word, pos):
|
|
| 45 |
return [lemma.name() for lemma in lemmas]
|
| 46 |
return []
|
| 47 |
|
| 48 |
-
# Paraphrasing function using spaCy and NLTK
|
| 49 |
def paraphrase_with_spacy_nltk(text):
|
| 50 |
doc = nlp(text)
|
| 51 |
paraphrased_words = []
|
|
@@ -73,7 +80,10 @@ def paraphrase_with_spacy_nltk(text):
|
|
| 73 |
# Join the words back into a sentence
|
| 74 |
paraphrased_sentence = ' '.join(paraphrased_words)
|
| 75 |
|
| 76 |
-
|
|
|
|
|
|
|
|
|
|
| 77 |
|
| 78 |
# Gradio interface definition
|
| 79 |
with gr.Blocks() as interface:
|
|
@@ -81,7 +91,7 @@ with gr.Blocks() as interface:
|
|
| 81 |
with gr.Column():
|
| 82 |
text_input = gr.Textbox(lines=5, label="Input Text")
|
| 83 |
detect_button = gr.Button("AI Detection")
|
| 84 |
-
paraphrase_button = gr.Button("Paraphrase with spaCy & NLTK")
|
| 85 |
with gr.Column():
|
| 86 |
output_text = gr.Textbox(label="Output")
|
| 87 |
|
|
|
|
| 6 |
import nltk
|
| 7 |
from nltk.corpus import wordnet
|
| 8 |
from gensim import downloader as api
|
| 9 |
+
from textblob import TextBlob # Import TextBlob for grammar correction
|
| 10 |
|
| 11 |
# Ensure necessary NLTK data is downloaded
|
| 12 |
nltk.download('wordnet')
|
|
|
|
| 29 |
tokenizer = AutoTokenizer.from_pretrained("distilbert-base-uncased-finetuned-sst-2-english")
|
| 30 |
model = AutoModelForSequenceClassification.from_pretrained("distilbert-base-uncased-finetuned-sst-2-english").to(device)
|
| 31 |
|
| 32 |
+
# Function to correct grammar using TextBlob
|
| 33 |
+
def correct_grammar_with_textblob(text):
    """Return *text* with TextBlob's spelling/grammar correction applied.

    TextBlob.correct() performs word-level spelling correction; the result
    is converted back from a TextBlob to a plain str before returning.
    """
    # Single pass: wrap, correct, and stringify in one expression.
    return str(TextBlob(text).correct())
|
| 37 |
+
|
| 38 |
# AI detection function using DistilBERT
|
| 39 |
def detect_ai_generated(text):
|
| 40 |
inputs = tokenizer(text, return_tensors="pt", truncation=True, max_length=512).to(device)
|
|
|
|
| 52 |
return [lemma.name() for lemma in lemmas]
|
| 53 |
return []
|
| 54 |
|
| 55 |
+
# Paraphrasing function using spaCy and NLTK with TextBlob grammar correction
|
| 56 |
def paraphrase_with_spacy_nltk(text):
|
| 57 |
doc = nlp(text)
|
| 58 |
paraphrased_words = []
|
|
|
|
| 80 |
# Join the words back into a sentence
|
| 81 |
paraphrased_sentence = ' '.join(paraphrased_words)
|
| 82 |
|
| 83 |
+
# Correct the grammar of the paraphrased sentence using TextBlob
|
| 84 |
+
corrected_sentence = correct_grammar_with_textblob(paraphrased_sentence)
|
| 85 |
+
|
| 86 |
+
return corrected_sentence
|
| 87 |
|
| 88 |
# Gradio interface definition
|
| 89 |
with gr.Blocks() as interface:
|
|
|
|
| 91 |
with gr.Column():
|
| 92 |
text_input = gr.Textbox(lines=5, label="Input Text")
|
| 93 |
detect_button = gr.Button("AI Detection")
|
| 94 |
+
paraphrase_button = gr.Button("Paraphrase with spaCy & NLTK (Grammar Corrected with TextBlob)")
|
| 95 |
with gr.Column():
|
| 96 |
output_text = gr.Textbox(label="Output")
|
| 97 |
|