Spaces:

ozgurunlu
/

m-check

Sleeping

App Files Files Community

Ozgur Unlu committed on Nov 6, 2024

Commit

a7de25c

1 Parent(s): 72d5e40

error fixes for grammar check

Browse files

Files changed (2) hide show

app.py +25 -17
requirements.txt +1 -1

app.py CHANGED Viewed

@@ -8,7 +8,7 @@ import os
 from pdf_generator import ReportGenerator
 from news_checker import NewsChecker
 from dotenv import load_dotenv
-import language_tool_python  # For spell checking
 load_dotenv()
@@ -20,11 +20,11 @@ def load_models():
     hate_model = AutoModelForSequenceClassification.from_pretrained(model_name)
     # Initialize spell checker
-    spell_tool = language_tool_python.LanguageTool('en-US')
     return {
         'hate_speech': (hate_model, hate_tokenizer),
-        'spell_check': spell_tool
     }
 # Initialize news checker
@@ -68,23 +68,31 @@ def check_hate_speech_and_bias(text, model, tokenizer):
             'message': f'Error in hate speech/bias detection: {str(e)}'
         }
-def check_spelling(text, spell_tool):
     try:
-        matches = spell_tool.check(text)
-        spelling_errors = []
-        for match in matches:
-            if match.ruleId in ['MORFOLOGIK_RULE_EN_US', 'TYPOS']:  # Only check spelling errors
-                error_word = text[match.offset:match.offset + match.errorLength]
-                suggestions = match.replacements[:3]  # Limit to top 3 suggestions
-                if suggestions:
-                    spelling_errors.append(f"'{error_word}' -> suggestions: {', '.join(suggestions)}")
-        if spelling_errors:
-            return {
-                'status': 'warning',
-                'message': 'Misspelled words found:\n' + '\n'.join(spelling_errors)
-            }
         return {
             'status': 'pass',
             'message': 'No spelling errors detected'

 from pdf_generator import ReportGenerator
 from news_checker import NewsChecker
 from dotenv import load_dotenv
+from spellchecker import SpellChecker
 load_dotenv()
     hate_model = AutoModelForSequenceClassification.from_pretrained(model_name)
     # Initialize spell checker
+    spell = SpellChecker()
     return {
         'hate_speech': (hate_model, hate_tokenizer),
+        'spell_check': spell
     }
 # Initialize news checker
             'message': f'Error in hate speech/bias detection: {str(e)}'
         }
+def check_spelling(text, spell_checker):
     try:
+        # Split text into words and clean them
+        words = text.replace('\n', ' ').split()
+        words = [word.strip('.,!?()[]{}":;') for word in words]
+        # Find misspelled words
+        misspelled = spell_checker.unknown(words)
+        if misspelled:
+            corrections = []
+            for word in misspelled:
+                # Get the most likely corrections
+                candidates = spell_checker.candidates(word)
+                if candidates:
+                    # Take up to 3 suggestions
+                    suggestions = list(candidates)[:3]
+                    corrections.append(f"'{word}' -> suggestions: {', '.join(suggestions)}")
+            if corrections:
+                return {
+                    'status': 'warning',
+                    'message': 'Misspelled words found:\n' + '\n'.join(corrections)
+                }
         return {
             'status': 'pass',
             'message': 'No spelling errors detected'

requirements.txt CHANGED Viewed

@@ -8,4 +8,4 @@ pandas==2.1.4
 numpy==1.24.3
 requests==2.31.0
 python-dotenv==1.0.0
-language-tool-python==2.7.1

 numpy==1.24.3
 requests==2.31.0
 python-dotenv==1.0.0
+pyspellchecker==0.7.2