nlpblogs committed on
Commit
aa023ef
·
verified ·
1 Parent(s): f8761ad

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -21
app.py CHANGED
@@ -1,24 +1,14 @@
1
  import streamlit as st
2
  from PyPDF2 import PdfReader
3
 
4
- import streamlit as st
5
- import pandas as pd
6
- from io import StringIO
7
-
8
- uploaded_file = st.file_uploader("Choose a file")
9
- if uploaded_file is not None:
10
- # To read file as bytes:
11
- bytes_data = uploaded_file.getvalue()
12
- st.write(bytes_data)
13
-
14
- # To convert to a string based IO:
15
- stringio = StringIO(uploaded_file.getvalue().decode("utf-8"))
16
- st.write(stringio)
17
-
18
- # To read file as string:
19
- string_data = stringio.read()
20
- st.write(string_data)
21
-
22
- # Can be used wherever a "file-like" object is accepted:
23
- dataframe = pd.read_csv(uploaded_file)
24
- st.write(dataframe)
 
1
  import streamlit as st
2
  from PyPDF2 import PdfReader
3
 
4
+ uploaded_files = st.file_uploader(
5
+ "Choose a CSV file", type="pdf"
6
+ )
7
+ for uploaded_file in uploaded_files:
8
+ pdf_reader = PdfReader(uploaded_files) # read your PDF file
9
+ # extract the text data from your PDF file after looping through its pages with the .extract_text() method
10
+ text_data= ""
11
+ for page in pdf_reader.pages: # for loop method
12
+ text_data+= page.extract_text()
13
+
14
+ st.write(text_data) # view the text data