Spaces:
Running
Running
Update src/documentProcessing.py
Browse files
src/documentProcessing.py
CHANGED
@@ -1,6 +1,11 @@
|
|
1 |
import docx
|
2 |
import PyPDF2
|
|
|
|
|
|
|
|
|
3 |
import tempfile
|
|
|
4 |
|
5 |
def extract_text_from_pdf(pdf_path):
|
6 |
text = ""
|
|
|
1 |
import docx
|
2 |
import PyPDF2
|
3 |
+
import os
|
4 |
+
import re
|
5 |
+
import json
|
6 |
+
import time
|
7 |
import tempfile
|
8 |
+
from typing import Dict, Any, List, Optional
|
9 |
|
10 |
def extract_text_from_pdf(pdf_path):
|
11 |
text = ""
|