huamnifierWithSimpleGrammer

Running

App Files Files

sashtech committed on Sep 2, 2024

Commit

ae10f26

verified ·

1 Parent(s): 3fa7f9a

Update app.py

Browse files

Files changed (1) hide show

app.py +8 -8

app.py CHANGED Viewed

@@ -1,13 +1,11 @@
 import gradio as gr
-from transformers import AutoTokenizer, AutoModelForSequenceClassification
 import torch
 import spacy
 import subprocess
 import nltk
-import gingerit
 from nltk.corpus import wordnet
 from gensim import downloader as api
-from gingerit.gingerit import GingerIt  # Import GingerIt for grammar correction
 # Ensure necessary NLTK data is downloaded
 nltk.download('wordnet')
@@ -30,6 +28,9 @@ device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 tokenizer = AutoTokenizer.from_pretrained("distilbert-base-uncased-finetuned-sst-2-english")
 model = AutoModelForSequenceClassification.from_pretrained("distilbert-base-uncased-finetuned-sst-2-english").to(device)
 # AI detection function using DistilBERT
 def detect_ai_generated(text):
     inputs = tokenizer(text, return_tensors="pt", truncation=True, max_length=512).to(device)
@@ -47,7 +48,7 @@ def get_synonyms_nltk(word, pos):
         return [lemma.name() for lemma in lemmas]
     return []
-# Paraphrasing function using spaCy and NLTK (without grammar correction)
 def paraphrase_with_spacy_nltk(text):
     doc = nlp(text)
     paraphrased_words = []
@@ -77,11 +78,10 @@ def paraphrase_with_spacy_nltk(text):
     return paraphrased_sentence
-# Grammar correction function using GingerIt
 def correct_grammar(text):
-    parser = GingerIt()
-    result = parser.parse(text)
-    return result['result']  # Return the corrected text
 # Combined function: Paraphrase -> Grammar Check
 def paraphrase_and_correct(text):

 import gradio as gr
+from transformers import AutoTokenizer, AutoModelForSequenceClassification, pipeline
 import torch
 import spacy
 import subprocess
 import nltk
 from nltk.corpus import wordnet
 from gensim import downloader as api
 # Ensure necessary NLTK data is downloaded
 nltk.download('wordnet')
 tokenizer = AutoTokenizer.from_pretrained("distilbert-base-uncased-finetuned-sst-2-english")
 model = AutoModelForSequenceClassification.from_pretrained("distilbert-base-uncased-finetuned-sst-2-english").to(device)
+# Load grammar correction model from Hugging Face
+grammar_corrector = pipeline("text2text-generation", model="vennify/t5-base-grammar-correction", device=0 if torch.cuda.is_available() else -1)
 # AI detection function using DistilBERT
 def detect_ai_generated(text):
     inputs = tokenizer(text, return_tensors="pt", truncation=True, max_length=512).to(device)
         return [lemma.name() for lemma in lemmas]
     return []
+# Paraphrasing function using spaCy and NLTK
 def paraphrase_with_spacy_nltk(text):
     doc = nlp(text)
     paraphrased_words = []
     return paraphrased_sentence
+# Grammar correction function using the Hugging Face model
 def correct_grammar(text):
+    corrected_text = grammar_corrector(text)[0]['generated_text']
+    return corrected_text
 # Combined function: Paraphrase -> Grammar Check
 def paraphrase_and_correct(text):