| 
					
				 | 
			
			
				@@ -337,22 +337,25 @@ def hierarchical_traversal(root_path, all_records): 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 gov_commodity_jiangsu_city.process_folder(md['path']) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				 def main():
				     """Command-line entry point for the Jiangsu customs data crawl.

				     Parses the optional ``--year`` argument and starts the Selenium crawl:

				     * ``--year 2023`` calls ``crawl_with_selenium`` in ``'all'`` mode and
				       always reports the elapsed time to DingTalk afterwards.
				     * Any other value (including the default ``None``) calls it in
				       ``'auto'`` mode and reports the elapsed time only when the crawl
				       returns ``'finish'``.

				     Any ``Exception`` raised by the crawl is reported to DingTalk and its
				     full traceback is written to the log; it is not re-raised.
				     """
				     parser = argparse.ArgumentParser(description='海关数据智能抓取系统')
				     parser.add_argument('--year', type=int, default=None, help='终止年份(如2023),未指定时抓取最新两个月')
				     args = parser.parse_args()

				     # Both modes start from the same listing page; keep the literal in one place.
				     start_url = 'http://nanjing.customs.gov.cn/nanjing_customs/zfxxgk58/fdzdgknr95/3010051/589289/7e2fcc72-1.html'
				     start_time = time.time()

				     # Only the crawl itself is guarded: argparse reports bad arguments via
				     # SystemExit, which ``except Exception`` would not intercept anyway.
				     try:
				         if args.year == 2023:
				             log.info("正在全量采集江苏省海关数据")
				             crawl_with_selenium(start_url, 'all')
				             duration = time.time() - start_time
				             send_dingtalk_message(f'【江苏省海关】全量数据采集完成,耗时 {duration:.2f} 秒')
				         else:
				             log.info("正在增量采集江苏省海关数据")
				             res = crawl_with_selenium(start_url, 'auto')
				             # NOTE(review): any result other than 'finish' ends silently;
				             # confirm against crawl_with_selenium whether that is intended.
				             if res == 'finish':
				                 duration = time.time() - start_time
				                 send_dingtalk_message(f'【江苏省海关】增量数据采集完成,耗时 {duration:.2f} 秒')
				     except Exception as e:
				         # Local import keeps this block self-contained.
				         import traceback

				         # Capture the traceback before doing anything else in the handler.
				         details = traceback.format_exc()
				         # Notify first so the alert is sent exactly as before, then keep
				         # the traceback, which the short chat message does not carry.
				         send_dingtalk_message(f"【江苏省海关】发生错误:{e}")
				         # NOTE(review): assumes ``log`` offers ``error`` next to ``info``.
				         log.error(details)
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				 # Start the crawl only when this file is executed as a script,
				 # not when it is imported as a module.
				 if __name__ == '__main__':
				     main()
			 |