-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathrun_script.py
executable file
·29 lines (25 loc) · 1002 Bytes
/
run_script.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
from twisted.internet import reactor
from scrapy.crawler import CrawlerRunner
from scrapy.utils.log import configure_logging
from scrapy.utils.project import get_project_settings
from tophub.spiders.github_spider import GitHubSpider
from tophub.spiders.juejin_spider import JueJinSpider
from tophub.spiders.douban_spider import DouBanSpiderFiction, \
DouBanSpiderNonFiction
from tophub.spiders.reddit_spider import RedditSpider
from tophub.spiders.segmentfault_spider import SegmentFaultSpider
from tophub.spiders.hacker_news import HackerNewsSpider
# Driver script: schedule every enabled spider on a single CrawlerRunner and
# run the Twisted reactor until the joined deferred fires.

# Log records are formatted as "<LEVEL>: <message>".
configure_logging({'LOG_FORMAT': '%(levelname)s: %(message)s'})

# One runner, configured from get_project_settings(), handles all spiders.
runner = CrawlerRunner(get_project_settings())

# Spiders are scheduled in exactly this order.
# RedditSpider is imported by this script but currently disabled, so it is
# deliberately absent from the tuple.
for spider_cls in (
    GitHubSpider,
    JueJinSpider,
    HackerNewsSpider,
    DouBanSpiderFiction,
    DouBanSpiderNonFiction,
    SegmentFaultSpider,
):
    runner.crawl(spider_cls)


def _stop_reactor(_result):
    """Stop the reactor; the value passed in by the deferred is ignored."""
    return reactor.stop()


# addBoth registers the callback for both the success and the failure path,
# so the reactor is stopped either way.
d = runner.join()
d.addBoth(_stop_reactor)

# Start the reactor; _stop_reactor above is what shuts it down.
reactor.run()