|
@@ -337,22 +337,25 @@ def hierarchical_traversal(root_path, all_records):
|
|
gov_commodity_jiangsu_city.process_folder(md['path'])
|
|
gov_commodity_jiangsu_city.process_folder(md['path'])
|
|
|
|
|
|
def main():
|
|
def main():
|
|
- parser = argparse.ArgumentParser(description='海关数据智能抓取系统')
|
|
|
|
- parser.add_argument('--year', type=int, default=None, help='终止年份(如2023),未指定时抓取最新两个月')
|
|
|
|
- args = parser.parse_args()
|
|
|
|
-
|
|
|
|
- start_time = time.time()
|
|
|
|
- if args.year == 2023:
|
|
|
|
- log.info("正在全量采集江苏省海关数据")
|
|
|
|
- crawl_with_selenium('http://nanjing.customs.gov.cn/nanjing_customs/zfxxgk58/fdzdgknr95/3010051/589289/7e2fcc72-1.html','all')
|
|
|
|
- duration = time.time() - start_time
|
|
|
|
- send_dingtalk_message(f'【江苏省海关】全量数据采集完成,耗时 {duration:.2f} 秒')
|
|
|
|
- else:
|
|
|
|
- log.info("正在增量采集江苏省海关数据")
|
|
|
|
- res = crawl_with_selenium('http://nanjing.customs.gov.cn/nanjing_customs/zfxxgk58/fdzdgknr95/3010051/589289/7e2fcc72-1.html','auto')
|
|
|
|
- if res == 'finish':
|
|
|
|
|
|
+ try:
|
|
|
|
+ parser = argparse.ArgumentParser(description='海关数据智能抓取系统')
|
|
|
|
+ parser.add_argument('--year', type=int, default=None, help='终止年份(如2023),未指定时抓取最新两个月')
|
|
|
|
+ args = parser.parse_args()
|
|
|
|
+
|
|
|
|
+ start_time = time.time()
|
|
|
|
+ if args.year == 2023:
|
|
|
|
+ log.info("正在全量采集江苏省海关数据")
|
|
|
|
+ crawl_with_selenium('http://nanjing.customs.gov.cn/nanjing_customs/zfxxgk58/fdzdgknr95/3010051/589289/7e2fcc72-1.html','all')
|
|
duration = time.time() - start_time
|
|
duration = time.time() - start_time
|
|
- send_dingtalk_message(f'【江苏省海关】增量数据采集完成,耗时 {duration:.2f} 秒')
|
|
|
|
|
|
+ send_dingtalk_message(f'【江苏省海关】全量数据采集完成,耗时 {duration:.2f} 秒')
|
|
|
|
+ else:
|
|
|
|
+ log.info("正在增量采集江苏省海关数据")
|
|
|
|
+ res = crawl_with_selenium('http://nanjing.customs.gov.cn/nanjing_customs/zfxxgk58/fdzdgknr95/3010051/589289/7e2fcc72-1.html','auto')
|
|
|
|
+ if res == 'finish':
|
|
|
|
+ duration = time.time() - start_time
|
|
|
|
+ send_dingtalk_message(f'【江苏省海关】增量数据采集完成,耗时 {duration:.2f} 秒')
|
|
|
|
+ except Exception as e:
|
|
|
|
+ send_dingtalk_message(f"【江苏省海关】发生错误:{e}")
|
|
|
|
|
|
if __name__ == '__main__':
|
|
if __name__ == '__main__':
|
|
main()
|
|
main()
|