hackerbyhobby committed on
Commit
f7e3939
·
unverified ·
1 Parent(s): c289167

updated url regex

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -282,7 +282,7 @@ def smishing_detector(input_type, text, image):
282
  lower_text = combined_text.lower()
283
  smishing_keys, scam_keys, _ = get_keywords_by_language(combined_text)
284
 
285
- found_urls = re.findall(r"(https?://[^\s]+)", lower_text)
286
  found_smishing = [kw for kw in smishing_keys if kw in lower_text]
287
  found_other_scam = [kw for kw in scam_keys if kw in lower_text]
288
 
 
282
  lower_text = combined_text.lower()
283
  smishing_keys, scam_keys, _ = get_keywords_by_language(combined_text)
284
 
285
+ found_urls = re.findall(r"(https?://[^\s]+|\b(?:[a-zA-Z0-9.-]+\.(?:com|net|org|edu|gov|mil|io|ai|co|info|biz|us|uk|de|fr|es|ru|jp|cn|in|au|ca|br|mx|it|nl|se|no|fi|ch|pl|kr|vn|id|tw|sg|hk))\b)", lower_text)
286
  found_smishing = [kw for kw in smishing_keys if kw in lower_text]
287
  found_other_scam = [kw for kw in scam_keys if kw in lower_text]
288