summary | refs | log | tree | commit | diff
path: root/commcrawler/scrapy.py
diff options
context:
space:
mode:
Diffstat (limited to 'commcrawler/scrapy.py')
-rw-r--r-- commcrawler/scrapy.py 7
1 files changed, 3 insertions, 4 deletions
diff --git a/commcrawler/scrapy.py b/commcrawler/scrapy.py
index 5fbeb43..8c78e61 100644
--- a/commcrawler/scrapy.py
+++ b/commcrawler/scrapy.py
@@ -33,6 +33,9 @@ CALENDAR_KEYS = ["agenda", "calendar"]
MAX_LINKS = None # if None no max
TIMEOUT = datetime.timedelta(minutes=settings.CRAWL_TIMEOUT)
+NUMBER_PER_PAGE = settings.NUMBER_PER_SESSION
+ONLY_FIRST_PAGE = True
+
class DefaultSpider:
name = None
@@ -317,10 +320,6 @@ def update_db_result(result_dct, values):
result.save()
-NUMBER_PER_PAGE = 250
-ONLY_FIRST_PAGE = True
-
-
def launch_crawl(crawl_item, excluded_domains=None):
scrap_settings = settings.SCRAPPY_SETTINGS.copy()
crawl_item.started = timezone.now()