diff options
author | neodarz <neodarz@neodarz.net> | 2019-01-19 00:02:57 +0100 |
---|---|---|
committer | neodarz <neodarz@neodarz.net> | 2019-01-19 00:02:57 +0100 |
commit | a3f01580faf6caee4abcc8e682567b87380857b9 (patch) | |
tree | dbf5e0a9866b3aac7e7bb64f2eab8c005e1c28cd /crawler/neodarznet/spiders/scrape.py | |
parent | 073e919ef198a04da1e5ed28a7dfbc5d9681fc14 (diff) | |
download | khanindexer-a3f01580faf6caee4abcc8e682567b87380857b9.tar.xz khanindexer-a3f01580faf6caee4abcc8e682567b87380857b9.zip |
Add khanindex nevrax indexation
Diffstat (limited to '')
-rw-r--r-- | crawler/neodarznet/spiders/scrape.py | 9 |
1 files changed, 7 insertions, 2 deletions
```diff
diff --git a/crawler/neodarznet/spiders/scrape.py b/crawler/neodarznet/spiders/scrape.py
index a32a3e4..e16ede2 100644
--- a/crawler/neodarznet/spiders/scrape.py
+++ b/crawler/neodarznet/spiders/scrape.py
@@ -4,8 +4,13 @@ from scrapy.spiders import CrawlSpider, Rule
 from scrapy.linkextractors import LinkExtractor
 from scrapy import Selector
 
-class ScrapSpider(CrawlSpider):
-    name = "scrape"
+class NeodarznetSpider(CrawlSpider):
+    name = "neodarznet"
+    custom_settings = {
+        'ITEM_PIPELINES': {
+            'crawler.neodarznet.pipelines.NeodarznetPipeline': 0
+        }
+    }
     allow_domains = ['neodarz.net']
     start_urls = [
         'https://neodarz.net/',
```