Spaces:

manasagangotri
/

classify

Running

manasagangotri committed on Nov 1, 2024

Commit

8c09499

verified ·

1 Parent(s): ea25a6f

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -3,7 +3,13 @@ from modules.parse_pdf import process_pdf
 from modules.classify import classify_text_multi  # Importing BERT model classification
 from modules.RandomForest import classify_text_rf,classify_text_rf_multi #Importing single and multi-label classification
 from modules.SVM import classify_text_svm,classify_text_svm_multi #Importing single and multi-label classification
 # Function to process and classify PDF using both BERT and Random Forest models
 def process_and_classify_pdf(file):
     # Step 1: Process the PDF to extract and clean the text

 from modules.classify import classify_text_multi  # Importing BERT model classification
 from modules.RandomForest import classify_text_rf,classify_text_rf_multi #Importing single and multi-label classification
 from modules.SVM import classify_text_svm,classify_text_svm_multi #Importing single and multi-label classification
+import nltk
+# Check if the stopwords resource is available; if not, download it
+try:
+    nltk.data.find('corpora/stopwords')
+except LookupError:
+    nltk.download('stopwords')
 # Function to process and classify PDF using both BERT and Random Forest models
 def process_and_classify_pdf(file):
     # Step 1: Process the PDF to extract and clean the text