summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
-rw-r--r-- Makefile 10
-rw-r--r-- commcrawler/models.py 5
-rw-r--r-- fixtures/commcrawler.json 8
3 files changed, 20 insertions, 3 deletions
diff --git a/Makefile b/Makefile
index 270eca1..5401331 100644
--- a/Makefile
+++ b/Makefile
@@ -30,14 +30,20 @@ collectstatic: ## web - collect static files to serve
update: collectstatic compilemessages migrate ## update
echo "OK"
+fixture: ## create fixtures (excluded domains)
+ $(PYTHON) manage.py dumpdata --indent 4 --natural-primary \
+ commcrawler.ExludedDomains > fixtures/commcrawler.json
+
+install_fixture: ## install fixtures (excluded domains)
+ $(PYTHON) manage.py loaddata fixtures/commcrawler.json
+
default_import: ## import default data
$(PYTHON) manage.py import_csv_communes data_src/communes.csv
$(PYTHON) manage.py import_csv_autres data_src/autres.csv
-regenerate_all: migrate default_import ## regenerate all the database
+regenerate_all: migrate default_import install_fixture ## regenerate all the database
$(PYTHON) manage.py createsuperuser
-
crawl: ## launch crawl on the first planified crawler
$(PYTHON) manage.py launch_crawl --first-available
diff --git a/commcrawler/models.py b/commcrawler/models.py
index b520b09..ca26ec1 100644
--- a/commcrawler/models.py
+++ b/commcrawler/models.py
@@ -18,7 +18,10 @@ class ExludedDomains(models.Model):
verbose_name_plural = _("Excluded domains")
def __str__(self):
- return self.url
+ return self.domain
+
+ def natural_key(self):
+ return self.domain
class Crawl(models.Model):
diff --git a/fixtures/commcrawler.json b/fixtures/commcrawler.json
new file mode 100644
index 0000000..8ec419b
--- /dev/null
+++ b/fixtures/commcrawler.json
@@ -0,0 +1,8 @@
+[
+{
+ "model": "commcrawler.exludeddomains",
+ "fields": {
+ "domain": "hugedomains.com"
+ }
+}
+]