diff options
-rw-r--r-- | Makefile | 10 | ||||
-rw-r--r-- | commcrawler/models.py | 5 | ||||
-rw-r--r-- | fixtures/commcrawler.json | 8 |
3 files changed, 20 insertions, 3 deletions
@@ -30,14 +30,20 @@ collectstatic: ## web - collect static files to serve update: collectstatic compilemessages migrate ## update echo "OK" +fixture: ## create fixtures (excluded domains) + $(PYTHON) manage.py dumpdata --indent 4 --natural-primary \ + commcrawler.ExludedDomains > fixtures/commcrawler.json + +install_fixture: ## install fixtures (excluded domains) + $(PYTHON) manage.py loaddata fixtures/commcrawler.json + default_import: ## import default data $(PYTHON) manage.py import_csv_communes data_src/communes.csv $(PYTHON) manage.py import_csv_autres data_src/autres.csv -regenerate_all: migrate default_import ## regenerate all the database +regenerate_all: migrate default_import install_fixture ## regenerate all the database $(PYTHON) manage.py createsuperuser - crawl: ## launch crawl on the first planified crawler $(PYTHON) manage.py launch_crawl --first-available diff --git a/commcrawler/models.py b/commcrawler/models.py index b520b09..ca26ec1 100644 --- a/commcrawler/models.py +++ b/commcrawler/models.py @@ -18,7 +18,10 @@ class ExludedDomains(models.Model): verbose_name_plural = _("Excluded domains") def __str__(self): - return self.url + return self.domain + + def natural_key(self): + return self.domain class Crawl(models.Model): diff --git a/fixtures/commcrawler.json b/fixtures/commcrawler.json new file mode 100644 index 0000000..8ec419b --- /dev/null +++ b/fixtures/commcrawler.json @@ -0,0 +1,8 @@ +[ +{ + "model": "commcrawler.exludeddomains", + "fields": { + "domain": "hugedomains.com" + } +} +] |