huamnifierWithSimpleGrammer

Running

App Files Files

sashtech committed on Sep 2, 2024

Commit

cdd9b28

verified ·

1 Parent(s): e9b5c2e

Update app.py

Browse files

Files changed (1) hide show

app.py +10 -14

app.py CHANGED Viewed

@@ -5,8 +5,7 @@ import spacy
 import subprocess
 import nltk
 from nltk.corpus import wordnet
-from gingerit.gingerit import GingerIt
 from gensim import downloader as api
 # Ensure necessary NLTK data is downloaded
@@ -30,15 +29,12 @@ device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 tokenizer = AutoTokenizer.from_pretrained("distilbert-base-uncased-finetuned-sst-2-english")
 model = AutoModelForSequenceClassification.from_pretrained("distilbert-base-uncased-finetuned-sst-2-english").to(device)
-# Initialize Gingerit for grammar correction
-def correct_grammar_with_gingerit(text):
-    try:
-        parser = GingerIt()
-        result = parser.parse(text)
-        return result['result']
-    except Exception as e:
-        print(f"Error in Gingerit grammar correction: {e}")
-        return text  # Return the original text if Gingerit fails
 # AI detection function using DistilBERT
 def detect_ai_generated(text):
@@ -57,7 +53,7 @@ def get_synonyms_nltk(word, pos):
         return [lemma.name() for lemma in lemmas]
     return []
-# Paraphrasing function using spaCy and NLTK with Gingerit grammar correction
 def paraphrase_with_spacy_nltk(text):
     doc = nlp(text)
     paraphrased_words = []
@@ -85,8 +81,8 @@ def paraphrase_with_spacy_nltk(text):
     # Join the words back into a sentence
     paraphrased_sentence = ' '.join(paraphrased_words)
-    # Correct the grammar of the paraphrased sentence using Gingerit
-    corrected_sentence = correct_grammar_with_gingerit(paraphrased_sentence)
     return corrected_sentence

 import subprocess
 import nltk
 from nltk.corpus import wordnet
+import language_tool_python  # Import language-tool-python for grammar correction
 from gensim import downloader as api
 # Ensure necessary NLTK data is downloaded
 tokenizer = AutoTokenizer.from_pretrained("distilbert-base-uncased-finetuned-sst-2-english")
 model = AutoModelForSequenceClassification.from_pretrained("distilbert-base-uncased-finetuned-sst-2-english").to(device)
+# Function to correct grammar using language-tool-python
+def correct_grammar_with_language_tool(text):
+    tool = language_tool_python.LanguageTool('en-US')
+    matches = tool.check(text)
+    corrected_text = language_tool_python.utils.correct(text, matches)
+    return corrected_text
 # AI detection function using DistilBERT
 def detect_ai_generated(text):
         return [lemma.name() for lemma in lemmas]
     return []
+# Paraphrasing function using spaCy and NLTK with grammar correction
 def paraphrase_with_spacy_nltk(text):
     doc = nlp(text)
     paraphrased_words = []
     # Join the words back into a sentence
     paraphrased_sentence = ' '.join(paraphrased_words)
+    # Correct the grammar of the paraphrased sentence using language-tool-python
+    corrected_sentence = correct_grammar_with_language_tool(paraphrased_sentence)
     return corrected_sentence