|
@@ -16,6 +16,7 @@ from crossborder.utils.db_helper import DBHelper
|
|
|
from crossborder.guangdong.guangdong_sub_customs_parse_excel import parse_excel
|
|
|
from crossborder.utils.constants import DOWNLOAD_DIR
|
|
|
from crossborder.utils.constants import GUANGDONG_CUSTOMS_URL
|
|
|
+from crossborder.utils.dingtalk import send_dingtalk_message
|
|
|
from crossborder.utils.download_utils import configure_stealth_options, generate_month_sequence, download_excel, download_excel2, \
|
|
|
batch_download_excel
|
|
|
from crossborder.utils.log import get_logger
|
|
@@ -262,10 +263,12 @@ def random_sleep(base=2, variance=5):
|
|
|
|
|
|
def main():
|
|
|
"""主入口(优化参数处理逻辑)"""
|
|
|
+ global target_months
|
|
|
parser = argparse.ArgumentParser(description='海关数据智能抓取系统')
|
|
|
parser.add_argument('--year', type=int, default=None,
|
|
|
help='终止年份(如2023),未指定时抓取最新两个月')
|
|
|
args = parser.parse_args()
|
|
|
+ start_time = time.time()
|
|
|
driver = webdriver.Firefox(options=configure_stealth_options(download_dir))
|
|
|
for customs_name in GUANGDONG_CUSTOMS_URL.keys():
|
|
|
try:
|
|
@@ -304,6 +307,12 @@ def main():
|
|
|
db_helper = DBHelper()
|
|
|
db_helper.update_prov_yoy("广东省")
|
|
|
log.info("\n广东省地级市数据同比更新结束")
|
|
|
+ duration = time.time() - start_time
|
|
|
+ minutes, seconds = divmod(duration, 60) # 转换为分钟和秒
|
|
|
+ message = f'【广东省-广州海关、深圳海关、拱北海关、汕头海关、江门海关、黄埔海关、湛江海关】{len(target_months)}个月份数据已采集完毕,总耗时:{int(minutes)}分{seconds:.1f}秒'
|
|
|
+ send_dingtalk_message(message)
|
|
|
|
|
|
if __name__ == "__main__":
|
|
|
- main()
|
|
|
+ main()
|
|
|
+ # db_helper = DBHelper()
|
|
|
+ # db_helper.update_prov_yoy("广东省")
|