huamnifierWithSimpleGrammer

Running

App Files

sashtech committed on Sep 11, 2024

Commit

9ea0d50

verified ·

1 Parent(s): aa379a6

Update app.py

Browse files

Files changed (1) hide show

app.py +36 -28

app.py CHANGED Viewed

@@ -5,31 +5,31 @@ import spacy
 import subprocess
 import nltk
 from nltk.corpus import wordnet
-from spellchecker import SpellChecker  # Import SpellChecker for spelling correction
 # Initialize the English text classification pipeline for AI detection
 pipeline_en = pipeline(task="text-classification", model="Hello-SimpleAI/chatgpt-detector-roberta")
 # Function to predict the label and score for English text (AI Detection)
 def predict_en(text):
     res = pipeline_en(text)[0]
     return res['label'], res['score']
-# Ensure necessary NLTK data is downloaded for Humanifier
 nltk.download('wordnet')
 nltk.download('omw-1.4')
-# Ensure the SpaCy model is installed for Humanifier
 try:
     nlp = spacy.load("en_core_web_sm")
 except OSError:
     subprocess.run(["python", "-m", "spacy", "download", "en_core_web_sm"])
     nlp = spacy.load("en_core_web_sm")
-# Initialize SpellChecker
-spell = SpellChecker()
-# Function to get synonyms using NLTK WordNet (Humanifier)
 def get_synonyms_nltk(word, pos):
     synsets = wordnet.synsets(word, pos=pos)
     if synsets:
@@ -37,7 +37,7 @@ def get_synonyms_nltk(word, pos):
         return [lemma.name() for lemma in lemmas]
     return []
-# Function to capitalize the first letter of sentences and proper nouns (Humanifier)
 def capitalize_sentences_and_nouns(text):
     doc = nlp(text)
     corrected_text = []
@@ -55,7 +55,20 @@ def capitalize_sentences_and_nouns(text):
     return ' '.join(corrected_text)
-# Function to correct singular/plural errors (Singular/Plural Correction)
 def correct_singular_plural_errors(text):
     doc = nlp(text)
     corrected_text = []
@@ -77,18 +90,6 @@ def correct_singular_plural_errors(text):
     return ' '.join(corrected_text)
-# Function to correct tense errors in a sentence (Tense Correction)
-def correct_tense_errors(text):
-    doc = nlp(text)
-    corrected_text = []
-    for token in doc:
-        if token.pos_ == "VERB" and token.dep_ in {"aux", "auxpass"}:
-            lemma = wordnet.morphy(token.text, wordnet.VERB) or token.text
-            corrected_text.append(lemma)
-        else:
-            corrected_text.append(token.text)
-    return ' '.join(corrected_text)
 # Function to check and correct article errors
 def correct_article_errors(text):
     doc = nlp(text)
@@ -122,11 +123,11 @@ def replace_with_synonym(token):
     if synonyms:
         synonym = synonyms[0]
-        if token.tag_ == "VBG":
             synonym = synonym + 'ing'
-        elif token.tag_ == "VBD" or token.tag_ == "VBN":
             synonym = synonym + 'ed'
-        elif token.tag_ == "VBZ":
             synonym = synonym + 's'
         return synonym
     return token.text
@@ -148,9 +149,9 @@ def ensure_subject_verb_agreement(text):
     corrected_text = []
     for token in doc:
         if token.dep_ == "nsubj" and token.head.pos_ == "VERB":
-            if token.tag_ == "NN" and token.head.tag_ != "VBZ":
                 corrected_text.append(token.head.lemma_ + "s")
-            elif token.tag_ == "NNS" and token.head.tag_ == "VBZ":
                 corrected_text.append(token.head.lemma_)
         corrected_text.append(token.text)
     return ' '.join(corrected_text)
@@ -158,10 +159,17 @@ def ensure_subject_verb_agreement(text):
 # Function to correct spelling errors
 def correct_spelling(text):
     words = text.split()
-    corrected_words = [spell.candidates(word) or word for word in words]
     return ' '.join(corrected_words)
-# Function to paraphrase, correct grammar, and fix spelling errors
 def paraphrase_and_correct(text):
     # Capitalize first to ensure proper noun capitalization
     paraphrased_text = capitalize_sentences_and_nouns(text)

 import subprocess
 import nltk
 from nltk.corpus import wordnet
+from spellchecker import SpellChecker
 # Initialize the English text classification pipeline for AI detection
 pipeline_en = pipeline(task="text-classification", model="Hello-SimpleAI/chatgpt-detector-roberta")
+# Initialize the spell checker
+spell = SpellChecker()
 # Function to predict the label and score for English text (AI Detection)
 def predict_en(text):
     res = pipeline_en(text)[0]
     return res['label'], res['score']
+# Ensure necessary NLTK data is downloaded
 nltk.download('wordnet')
 nltk.download('omw-1.4')
+# Ensure the SpaCy model is installed
 try:
     nlp = spacy.load("en_core_web_sm")
 except OSError:
     subprocess.run(["python", "-m", "spacy", "download", "en_core_web_sm"])
     nlp = spacy.load("en_core_web_sm")
+# Function to get synonyms using NLTK WordNet
 def get_synonyms_nltk(word, pos):
     synsets = wordnet.synsets(word, pos=pos)
     if synsets:
         return [lemma.name() for lemma in lemmas]
     return []
+# Function to capitalize the first letter of sentences and proper nouns
 def capitalize_sentences_and_nouns(text):
     doc = nlp(text)
     corrected_text = []
     return ' '.join(corrected_text)
+# Function to correct tense errors in a sentence
+def correct_tense_errors(text):
+    doc = nlp(text)
+    corrected_text = []
+    for token in doc:
+        if token.pos_ == "VERB" and token.dep_ in {"aux", "auxpass"}:
+            # Replace with appropriate verb form
+            lemma = wordnet.morphy(token.text, wordnet.VERB) or token.text
+            corrected_text.append(lemma)
+        else:
+            corrected_text.append(token.text)
+    return ' '.join(corrected_text)
+# Function to correct singular/plural errors
 def correct_singular_plural_errors(text):
     doc = nlp(text)
     corrected_text = []
     return ' '.join(corrected_text)
 # Function to check and correct article errors
 def correct_article_errors(text):
     doc = nlp(text)
     if synonyms:
         synonym = synonyms[0]
+        if token.tag_ == "VBG":  # Present participle (e.g., running)
             synonym = synonym + 'ing'
+        elif token.tag_ == "VBD" or token.tag_ == "VBN":  # Past tense or past participle
             synonym = synonym + 'ed'
+        elif token.tag_ == "VBZ":  # Third-person singular present
             synonym = synonym + 's'
         return synonym
     return token.text
     corrected_text = []
     for token in doc:
         if token.dep_ == "nsubj" and token.head.pos_ == "VERB":
+            if token.tag_ == "NN" and token.head.tag_ != "VBZ":  # Singular noun, should use singular verb
                 corrected_text.append(token.head.lemma_ + "s")
+            elif token.tag_ == "NNS" and token.head.tag_ == "VBZ":  # Plural noun, should not use singular verb
                 corrected_text.append(token.head.lemma_)
         corrected_text.append(token.text)
     return ' '.join(corrected_text)
 # Function to correct spelling errors
 def correct_spelling(text):
     words = text.split()
+    corrected_words = []
+    for word in words:
+        candidates = spell.candidates(word)
+        if candidates:
+            corrected_word = spell.candidates(word).pop()
+        else:
+            corrected_word = word
+        corrected_words.append(corrected_word)
     return ' '.join(corrected_words)
+# Function to paraphrase and correct grammar
 def paraphrase_and_correct(text):
     # Capitalize first to ensure proper noun capitalization
     paraphrased_text = capitalize_sentences_and_nouns(text)