MrSimple01 committed on
Commit
bcf9fd7
·
verified ·
1 Parent(s): 3a765ef

Update src/documentProcessing.py

Browse files
Files changed (1) hide show
  1. src/documentProcessing.py +5 -0
src/documentProcessing.py CHANGED
@@ -1,6 +1,11 @@
1
  import docx
2
  import PyPDF2
 
 
 
 
3
  import tempfile
 
4
 
5
  def extract_text_from_pdf(pdf_path):
6
  text = ""
 
1
  import docx
2
  import PyPDF2
3
+ import os
4
+ import re
5
+ import json
6
+ import time
7
  import tempfile
8
+ from typing import Dict, Any, List, Optional
9
 
10
  def extract_text_from_pdf(pdf_path):
11
  text = ""