浏览代码

feat(spider): 优化定时任务时间及增加页面获取日志

- 调整 bidding_main 定时任务触发时间从08:01改为05:01
- 调整 sold_main 定时任务触发时间从10:01改为07:01
- 注释掉初始时立即运行的任务调用,防止重复执行
- weika_sold_spider 在分页循环中增加“正在获取第 N 页数据”的日志输出,便于调试与监控
charley 提交于 1 个月前
父节点
当前提交
398f0560b6
共有 2 个文件被更改,包括 6 次插入和 5 次删除
  1. 1 0
      weikajia_spider/weika_sold_spider.py
  2. 5 5
      weikajia_spider/weika_spider.py

+ 1 - 0
weikajia_spider/weika_sold_spider.py

@@ -184,6 +184,7 @@ def fetch_all_pages(log):
     pages = (total + 9) // 10  # 计算页码
     log.info(f"一共有{total}条已售数据, 总页数: {pages}..................................")
     for page in range(1, pages + 1):
+        log.info(f"正在获取第{page}页数据..................")
         data = {
             "page": page,
             "pageSize": 10,

+ 5 - 5
weikajia_spider/weika_spider.py

@@ -36,18 +36,18 @@ def schedule_task():
     change_card_main
     """
     # 立即运行一次任务
-    run_threaded(bidding_main, log=logger)
-    run_threaded(change_card_main, log=logger)
-    run_threaded(sold_main, log=logger)
+    # run_threaded(bidding_main, log=logger)
+    # run_threaded(change_card_main, log=logger)
+    # run_threaded(sold_main, log=logger)
     # bidding_main(log=logger)
     # change_card_main(log=logger)
     # sold_main(log=logger)
 
     # 设置定时任务
     # schedule.every().day.at("00:00").do(run_threaded,clean_logs)
-    schedule.every().day.at("08:01").do(run_threaded, bidding_main, log=logger)
+    schedule.every().day.at("05:01").do(run_threaded, bidding_main, log=logger)
     schedule.every().day.at("00:01").do(run_threaded, change_card_main, log=logger)
-    schedule.every().day.at("10:01").do(run_threaded, sold_main, log=logger)
+    schedule.every().day.at("07:01").do(run_threaded, sold_main, log=logger)
     while True:
         schedule.run_pending()
         time.sleep(1)