无翻页系列.py 985 B

12345678910111213141516171819202122232425262728293031323334
  1. # -*- coding: utf-8 -*-
  2. # Author : Charley
  3. # Python : 3.10.8
  4. # Date : 2025/11/26 15:25
  5. import add_settings
  6. import pandas as pd
  7. series_url_list = add_settings.series_url_list
  8. # 存储不含 page_no= 的记录
  9. filtered_series = []
  10. # 遍历 series_url_list
  11. for category in series_url_list:
  12. category_name = category["category_name"]
  13. for year_data in category["years"]:
  14. year = year_data["year"]
  15. for series in year_data["series"]:
  16. series_name = series["series_name"]
  17. series_url = series["series_url"]
  18. # 判断是否含有 page_no=
  19. if "page_no=" not in series_url:
  20. filtered_series.append({
  21. "category_name": category_name,
  22. "year": year,
  23. "series_name": series_name,
  24. "series_url": series_url
  25. })
  26. # 导出到 Excel 文件
  27. df = pd.DataFrame(filtered_series)
  28. df.to_excel("series_without.xlsx", index=False)