Muhammad Abdur Rahman Saad
committed on
Commit
·
8107bcc
1
Parent(s):
fa7a873
daily.yml debug
Browse files
- .github/workflows/daily.yml +2 -2
- .gitignore +3 -1
- utils.py +2 -0
.github/workflows/daily.yml
CHANGED
@@ -34,8 +34,8 @@ jobs:
|
|
34 |
pip uninstall transformers -y
|
35 |
pip install transformers
|
36 |
pip install tensorflow
|
37 |
-
|
38 |
-
pip install
|
39 |
- name: Data Collection
|
40 |
env:
|
41 |
AWS_ACCESS_KEY_ID: ${{ secrets.AWS_ACCESS_KEY_ID }}
|
|
|
34 |
pip uninstall transformers -y
|
35 |
pip install transformers
|
36 |
pip install tensorflow
|
37 |
+
pip install tf-keras
|
38 |
+
pip install python-dotenv
|
39 |
- name: Data Collection
|
40 |
env:
|
41 |
AWS_ACCESS_KEY_ID: ${{ secrets.AWS_ACCESS_KEY_ID }}
|
.gitignore
CHANGED
@@ -1,4 +1,6 @@
|
|
1 |
-
env
|
|
|
|
|
2 |
__pycache__
|
3 |
downloaded_file.pdf
|
4 |
downloaded_file.docx
|
|
|
1 |
+
.env
|
2 |
+
data
|
3 |
+
venv
|
4 |
__pycache__
|
5 |
downloaded_file.pdf
|
6 |
downloaded_file.docx
|
utils.py
CHANGED
@@ -13,11 +13,13 @@ import pandas as pd
|
|
13 |
import requests
|
14 |
import boto3
|
15 |
from lxml import etree
|
|
|
16 |
from googletrans import Translator
|
17 |
from transformers import pipeline
|
18 |
from PyPDF2 import PdfReader
|
19 |
from langdetect import detect
|
20 |
|
|
|
21 |
AWS_ACCESS_KEY_ID = os.environ['AWS_ACCESS_KEY_ID']
|
22 |
AWS_SECRET_ACCESS_KEY = os.environ['AWS_SECRET_ACCESS_KEY']
|
23 |
|
|
|
13 |
import requests
|
14 |
import boto3
|
15 |
from lxml import etree
|
16 |
+
from dotenv import load_dotenv
|
17 |
from googletrans import Translator
|
18 |
from transformers import pipeline
|
19 |
from PyPDF2 import PdfReader
|
20 |
from langdetect import detect
|
21 |
|
22 |
+
load_dotenv()
|
23 |
AWS_ACCESS_KEY_ID = os.environ['AWS_ACCESS_KEY_ID']
|
24 |
AWS_SECRET_ACCESS_KEY = os.environ['AWS_SECRET_ACCESS_KEY']
|
25 |
|