nlpblogs committed on
Commit
0e0978c
·
verified ·
1 Parent(s): cef76db

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +31 -1
app.py CHANGED
@@ -43,7 +43,24 @@ if uploaded_files1:
43
  text_data = ""
44
  for page in pdf_reader.pages:
45
  text_data += page.extract_text()
46
- all_resumes_text1.append(text_data)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
47
  except Exception as e:
48
  st.error(f"Error processing file {uploaded_file.name}: {e}")
49
 
@@ -86,6 +103,19 @@ if uploaded_files2:
86
  text_data = ""
87
  for page in pdf_reader.pages:
88
  text_data += page.extract_text()
 
 
 
 
 
 
 
 
 
 
 
 
 
89
  all_resumes_text2.append(text_data)
90
  except Exception as e:
91
  st.error(f"Error processing file {uploaded_file.name}: {e}")
 
43
  text_data = ""
44
  for page in pdf_reader.pages:
45
  text_data += page.extract_text()
46
+ model = GLiNER.from_pretrained("urchade/gliner_base")
47
+ labels = ["person", "country", "organization", "time", "role"]
48
+ entities = model.predict_entities(text_data, labels)
49
+
50
+ entity_dict = {}
51
+ for label in labels:
52
+ entity_dict[label] = [entity["text"] for entity in entities if entity["label"] == label]
53
+
54
+ data = {"Text": text_data, **entity_dict}
55
+
56
+
57
+
58
+
59
+
60
+
61
+
62
+
63
+ all_resumes_text1.append(data)
64
  except Exception as e:
65
  st.error(f"Error processing file {uploaded_file.name}: {e}")
66
 
 
103
  text_data = ""
104
  for page in pdf_reader.pages:
105
  text_data += page.extract_text()
106
+ model = GLiNER.from_pretrained("urchade/gliner_base")
107
+ labels = ["person", "country", "organization", "time", "role"]
108
+ entities = model.predict_entities(text_data, labels)
109
+
110
+ entity_dict = {}
111
+ for label in labels:
112
+ entity_dict[label] = [entity["text"] for entity in entities if entity["label"] == label]
113
+
114
+ data = {"Text": text_data, **entity_dict}
115
+
116
+
117
+
118
+
119
  all_resumes_text2.append(text_data)
120
  except Exception as e:
121
  st.error(f"Error processing file {uploaded_file.name}: {e}")