summaryrefslogtreecommitdiff
path: root/commcrawler/management/commands/launch_crawl.py
blob: 050a54d327e5e9c3bdb310398e2ffc5f4ffb89b6 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
import csv
import sys

from django.core.management.base import BaseCommand

from commcrawler.models import Crawl
from commcrawler.scrapy import launch_crawl


class Command(BaseCommand):
    help = 'Launch a crawl'

    def add_arguments(self, parser):
        parser.add_argument(
            '--quiet', dest='quiet', action='store_true',
            help='Quiet output')

    def handle(self, *args, **options):
        quiet = options['quiet']
        q = Crawl.objects.filter(status="C")
        if not q.count():
            sys.stdout.write('No crawl waiting. Exit.\n')
            return

        crawls = dict([(c.pk, c) for c in q.all()])
        available_ids = crawls.keys()
        c_id = None
        while c_id not in available_ids:
            sys.stdout.write('Which crawl to launch (type the number):\n')
            for crawl_id, crawl in crawls.items():
                sys.stdout.write('* {} - {}\n'.format(crawl_id, crawl))
                sys.stdout.flush()
            try:
                c_id = int(input("# "))
            except ValueError:
                c_id = None
        current_crawl = crawls[c_id]
        launch_crawl(current_crawl)