From 4992631aef19d7f644cbcd6cd5e37dde37c6e149 Mon Sep 17 00:00:00 2001
From: cloudroam <cloudroam>
Date: 星期一, 14 七月 2025 10:46:10 +0800
Subject: [PATCH] add:增加对外接口

---
 douban.py | 11 ++++++++++-
 1 files changed, 10 insertions(+), 1 deletions(-)

diff --git a/douban.py b/douban.py
index 3608f81..9b00899 100644
--- a/douban.py
+++ b/douban.py
@@ -1,7 +1,16 @@
 from douban_tv import DoubanTVSpider
 from scrapy.crawler import CrawlerProcess
+import sys
 
 if __name__ == "__main__":
+    # 获取命令行参数
+    type_ = "tv"
+    tag = "热门"
+    if len(sys.argv) > 1:
+        type_ = sys.argv[1]
+    if len(sys.argv) > 2:
+        tag = sys.argv[2]
+
     process = CrawlerProcess(settings={
         "USER_AGENT": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 Chrome/112.0.0.0 Safari/537.36",
         "DOWNLOAD_DELAY": 2,
@@ -9,5 +18,5 @@
         "ROBOTSTXT_OBEY": False,
         "LOG_LEVEL": "INFO"
     })
-    process.crawl(DoubanTVSpider)
+    process.crawl(DoubanTVSpider, type_=type_, tag=tag)
     process.start()
\ No newline at end of file
-- 
Gitblit v1.9.3