1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
|
# -*- coding: utf-8 -*-
# Generated by Django 1.11 on 2019-08-07 01:17
from __future__ import unicode_literals
import datetime
import django.contrib.postgres.fields.jsonb
import django.contrib.sites.models
from django.db import migrations, models
import django.db.models.deletion
class Migration(migrations.Migration):
initial = True
dependencies = [
('commorganization', '0001_initial'),
]
operations = [
migrations.CreateModel(
name='Crawl',
fields=[
('id', models.AutoField(auto_created=True, primary_key=True, serialize=False, verbose_name='ID')),
('name', models.CharField(max_length=200, unique=True, verbose_name='Name')),
('created', models.DateTimeField(default=datetime.datetime.now, verbose_name='Creation date')),
('started', models.DateTimeField(blank=True, null=True, verbose_name='Start date')),
('ended', models.DateTimeField(blank=True, null=True, verbose_name='End date')),
('status', models.CharField(choices=[('C', 'Created'), ('P', 'In progress'), ('F', 'Finished')], default='C', max_length=1, verbose_name='Status')),
('targets', models.ManyToManyField(blank=True, to='commorganization.Target')),
],
options={
'verbose_name_plural': 'Crawls',
'verbose_name': 'Crawl',
'ordering': ('created', 'name'),
},
),
migrations.CreateModel(
name='CrawlLink',
fields=[
('id', models.AutoField(auto_created=True, primary_key=True, serialize=False, verbose_name='ID')),
('link', models.URLField(verbose_name='Link')),
],
options={
'verbose_name_plural': 'Crawl links',
'verbose_name': 'Crawl link',
},
),
migrations.CreateModel(
name='CrawlRelation',
fields=[
('id', models.AutoField(auto_created=True, primary_key=True, serialize=False, verbose_name='ID')),
('number', models.IntegerField(default=1, verbose_name='Number')),
('crawl', models.ForeignKey(on_delete=django.db.models.deletion.CASCADE, to='commcrawler.Crawl', verbose_name='Crawl')),
('destination', models.ForeignKey(on_delete=django.db.models.deletion.CASCADE, related_name='relation_destination', to='commorganization.Target', verbose_name='Destination')),
('source', models.ForeignKey(on_delete=django.db.models.deletion.CASCADE, related_name='relation_source', to='commorganization.Target', verbose_name='Source')),
],
options={
'verbose_name_plural': 'Crawl relations',
'verbose_name': 'Crawl relation',
},
),
migrations.CreateModel(
name='CrawlResult',
fields=[
('id', models.AutoField(auto_created=True, primary_key=True, serialize=False, verbose_name='ID')),
('started', models.DateTimeField(default=datetime.datetime.now, verbose_name='Start date')),
('duration', models.DurationField(blank=True, null=True, verbose_name='Duration')),
('status', models.CharField(choices=[('P', 'In progress'), ('F', 'Finished')], default='P', max_length=1, verbose_name='Status')),
('crawl_result', django.contrib.postgres.fields.jsonb.JSONField(default=list, verbose_name='Crawl result')),
('nb_external_link', models.IntegerField(default=0, verbose_name='Number of external links')),
('nb_internal_link', models.IntegerField(default=0, verbose_name='Number of internal links')),
('nb_images', models.IntegerField(default=0, verbose_name='Number of images')),
('nb_facebook', models.IntegerField(default=0, verbose_name='Number of Facebook links')),
('nb_twitter', models.IntegerField(default=0, verbose_name='Number of Twitter links')),
('nb_instagram', models.IntegerField(default=0, verbose_name='Number of Instagram links')),
('nb_youtube', models.IntegerField(default=0, verbose_name='Number of Youtube links')),
('nb_dailymotion', models.IntegerField(default=0, verbose_name='Number of Dailymotion links')),
('nb_vimeo', models.IntegerField(default=0, verbose_name='Number of Vimeo links')),
('nb_video', models.IntegerField(default=0, verbose_name='Number of videos')),
('nb_audio', models.IntegerField(default=0, verbose_name='Number of audios')),
('nb_internal_pdf', models.IntegerField(default=0, verbose_name='Number of internal PDF')),
('nb_external_pdf', models.IntegerField(default=0, verbose_name='Number of external PDF')),
('nb_internal_office', models.IntegerField(default=0, verbose_name='Number of internal office documents')),
('nb_external_office', models.IntegerField(default=0, verbose_name='Number of external office documents')),
('is_online', models.BooleanField(default=False, verbose_name='Website is online')),
('redirection', models.URLField(blank=True, null=True, verbose_name='Redirection')),
('crawl', models.ForeignKey(on_delete=django.db.models.deletion.CASCADE, to='commcrawler.Crawl', verbose_name='Crawl')),
('target', models.ForeignKey(on_delete=django.db.models.deletion.CASCADE, to='commorganization.Target', verbose_name='Target')),
],
options={
'verbose_name_plural': 'Crawl results',
'verbose_name': 'Crawl result',
},
),
migrations.CreateModel(
name='ExludedDomains',
fields=[
('id', models.AutoField(auto_created=True, primary_key=True, serialize=False, verbose_name='ID')),
('domain', models.CharField(max_length=100, unique=True, validators=[django.contrib.sites.models._simple_domain_name_validator], verbose_name='Domain name')),
],
options={
'verbose_name_plural': 'Excluded domains',
'verbose_name': 'Excluded domain',
},
),
migrations.AddField(
model_name='crawllink',
name='result',
field=models.ForeignKey(on_delete=django.db.models.deletion.CASCADE, to='commcrawler.CrawlResult', verbose_name='Result'),
),
migrations.AlterUniqueTogether(
name='crawlresult',
unique_together=set([('crawl', 'target')]),
),
migrations.AlterUniqueTogether(
name='crawlrelation',
unique_together=set([('crawl', 'source', 'destination')]),
),
]
|