-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathscrape.py
43 lines (38 loc) · 1.12 KB
/
scrape.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
from scrapy.crawler import CrawlerProcess
from scrapy.utils.project import get_project_settings
from news_scraper.spiders import (
BusinessStandardSpider,
BusinessTodaySpider,
EconomicTimesSpider,
FinancialExpressSpider,
FirstPostSpider,
FreePressJournalSpider,
IndianExpressSpider,
MoneyControlSpider,
NDTVProfitSpider,
News18Spider,
OutlookIndiaSpider,
TheHinduBusinessLineSpider,
TheHinduSpider,
ZeeNewsSpider,
CnbcTv18Spider
)
# Start from the project's Scrapy settings and point the log output of this
# run at scrape.log.
settings = get_project_settings()
settings.update({"LOG_FILE": "scrape.log"})

# One CrawlerProcess hosts every spider scheduled below.
process = CrawlerProcess(settings=settings)

# Spiders are scheduled in the order listed. Entries that are commented out
# are excluded from the run.
# NOTE(review): the reason those two spiders are disabled is not recorded
# here -- confirm before re-enabling them.
for spider_cls in (
    BusinessStandardSpider,
    BusinessTodaySpider,
    EconomicTimesSpider,
    FinancialExpressSpider,
    FirstPostSpider,
    FreePressJournalSpider,
    # IndianExpressSpider,
    # MoneyControlSpider,
    NDTVProfitSpider,
    News18Spider,
    OutlookIndiaSpider,
    TheHinduSpider,
    TheHinduBusinessLineSpider,
    ZeeNewsSpider,
    CnbcTv18Spider,
):
    process.crawl(spider_cls)

# Kick off the crawl once every spider has been queued.
process.start()