Spaces:

Oxbridge-Economics
/

Data-Collection-China

Running

Muhammad Abdur Rahman Saad committed on Aug 9, 2024

Commit

4c3d51c

1 Parent(s): 0b8b219

Update daily.py

Files changed (1) hide show

daily.py CHANGED Viewed

@@ -10,7 +10,6 @@ import urllib.request
 import uuid
 from datetime import datetime, timedelta
 from urllib.parse import urlparse
-from prefect import flow, task
 from lxml import etree
 from glue import glue_job_run
@@ -18,7 +17,6 @@ from utils import (crawl, datemodifier, encode, encode_content,
                    extract_from_pdf, extract_reference, fetch_url,
                    sentiment_computation, translate, update_content)
-@task(name = "crawl_eastmoney")
 def crawl_eastmoney(url, article):
     """
     Crawls the given URL and extracts information from the webpage.
@@ -66,7 +64,6 @@ def crawl_eastmoney(url, article):
     extract_reference(article)
     update_content(article)
-@task(name = "data collection")
 def daily():
     with open('xpath.json', 'r', encoding='UTF-8') as f:
         xpath_dict = json.load(f)
@@ -525,7 +522,7 @@ def daily():
                         except Exception as error:
                             print(error)
-@flow(name = "Data Collection China - Daily", log_prints=True)
 def data_collection():
     daily()
     glue_job_run()

 import uuid
 from datetime import datetime, timedelta
 from urllib.parse import urlparse
 from lxml import etree
 from glue import glue_job_run
                    extract_from_pdf, extract_reference, fetch_url,
                    sentiment_computation, translate, update_content)
 def crawl_eastmoney(url, article):
     """
     Crawls the given URL and extracts information from the webpage.
     extract_reference(article)
     update_content(article)
 def daily():
     with open('xpath.json', 'r', encoding='UTF-8') as f:
         xpath_dict = json.load(f)
                         except Exception as error:
                             print(error)
 def data_collection():
     daily()
     glue_job_run()