From a29144f89e0fe4e3e37ebd70c51471f2e02bfbaf Mon Sep 17 00:00:00 2001
From: trevineju
Date: Wed, 5 Jun 2024 17:12:04 -0300
Subject: [PATCH] Adiciona 9 novos raspadores

---
Review notes (this section is ignored by `git am`):
- Adds nine spiders for municipalities in Ceara. Each one subclasses
  BaseAdiariosV1Spider and only sets TERRITORY_ID, name, allowed_domains,
  BASE_URL and start_date.
- ce_sao_benedito.py: start_date corrected from date(18, 2, 15) to
  date(2018, 2, 15). A two-digit year is taken literally by
  datetime.date (year 18 AD), so the original value was valid Python but
  not a plausible first publication date. TODO: confirm 2018-02-15
  against the first edition listed on the municipality's site.
- The blob id on the ce_sao_benedito.py "index" line was generated for the
  uncorrected content; regenerate the patch if exact blob ids are needed
  (for example for `git am --3way`).

 .../gazette/spiders/ce/ce_limoeiro_do_norte.py        | 11 +++++++++++
 data_collection/gazette/spiders/ce/ce_milagres.py     | 11 +++++++++++
 data_collection/gazette/spiders/ce/ce_pacajus.py      | 11 +++++++++++
 data_collection/gazette/spiders/ce/ce_paramoti.py     | 11 +++++++++++
 data_collection/gazette/spiders/ce/ce_pereiro.py      | 11 +++++++++++
 data_collection/gazette/spiders/ce/ce_sao_benedito.py | 11 +++++++++++
 data_collection/gazette/spiders/ce/ce_taua.py         | 11 +++++++++++
 data_collection/gazette/spiders/ce/ce_tiangua.py      | 11 +++++++++++
 data_collection/gazette/spiders/ce/ce_uruoca.py       | 11 +++++++++++
 9 files changed, 99 insertions(+)
 create mode 100644 data_collection/gazette/spiders/ce/ce_limoeiro_do_norte.py
 create mode 100644 data_collection/gazette/spiders/ce/ce_milagres.py
 create mode 100644 data_collection/gazette/spiders/ce/ce_pacajus.py
 create mode 100644 data_collection/gazette/spiders/ce/ce_paramoti.py
 create mode 100644 data_collection/gazette/spiders/ce/ce_pereiro.py
 create mode 100644 data_collection/gazette/spiders/ce/ce_sao_benedito.py
 create mode 100644 data_collection/gazette/spiders/ce/ce_taua.py
 create mode 100644 data_collection/gazette/spiders/ce/ce_tiangua.py
 create mode 100644 data_collection/gazette/spiders/ce/ce_uruoca.py

diff --git a/data_collection/gazette/spiders/ce/ce_limoeiro_do_norte.py b/data_collection/gazette/spiders/ce/ce_limoeiro_do_norte.py
new file mode 100644
index 000000000..e0019034e
--- /dev/null
+++ b/data_collection/gazette/spiders/ce/ce_limoeiro_do_norte.py
@@ -0,0 +1,11 @@
+from datetime import date
+
+from gazette.spiders.base.adiarios_v1 import BaseAdiariosV1Spider
+
+
+class CeLimoeiroDoNorteSpider(BaseAdiariosV1Spider):
+    TERRITORY_ID = "2307601"
+    name = "ce_limoeiro_do_norte"
+    allowed_domains = ["limoeirodonorte.ce.gov.br"]
+    BASE_URL = "https://www.limoeirodonorte.ce.gov.br"
+    start_date = date(2017, 4, 10)
diff --git a/data_collection/gazette/spiders/ce/ce_milagres.py b/data_collection/gazette/spiders/ce/ce_milagres.py
new file mode 100644
index 000000000..29cc0004e
--- /dev/null
+++ b/data_collection/gazette/spiders/ce/ce_milagres.py
@@ -0,0 +1,11 @@
+from datetime import date
+
+from gazette.spiders.base.adiarios_v1 import BaseAdiariosV1Spider
+
+
+class CeMilagresSpider(BaseAdiariosV1Spider):
+    TERRITORY_ID = "2308302"
+    name = "ce_milagres"
+    allowed_domains = ["milagres.ce.gov.br"]
+    BASE_URL = "https://www.milagres.ce.gov.br"
+    start_date = date(2016, 5, 20)
diff --git a/data_collection/gazette/spiders/ce/ce_pacajus.py b/data_collection/gazette/spiders/ce/ce_pacajus.py
new file mode 100644
index 000000000..5a71d4dd5
--- /dev/null
+++ b/data_collection/gazette/spiders/ce/ce_pacajus.py
@@ -0,0 +1,11 @@
+from datetime import date
+
+from gazette.spiders.base.adiarios_v1 import BaseAdiariosV1Spider
+
+
+class CePacajusSpider(BaseAdiariosV1Spider):
+    TERRITORY_ID = "2309607"
+    name = "ce_pacajus"
+    allowed_domains = ["pacajus.ce.gov.br"]
+    BASE_URL = "https://www.pacajus.ce.gov.br"
+    start_date = date(2018, 10, 26)
diff --git a/data_collection/gazette/spiders/ce/ce_paramoti.py b/data_collection/gazette/spiders/ce/ce_paramoti.py
new file mode 100644
index 000000000..98811d851
--- /dev/null
+++ b/data_collection/gazette/spiders/ce/ce_paramoti.py
@@ -0,0 +1,11 @@
+from datetime import date
+
+from gazette.spiders.base.adiarios_v1 import BaseAdiariosV1Spider
+
+
+class CeParamotiSpider(BaseAdiariosV1Spider):
+    TERRITORY_ID = "2310407"
+    name = "ce_paramoti"
+    allowed_domains = ["paramoti.ce.gov.br"]
+    BASE_URL = "https://www.paramoti.ce.gov.br"
+    start_date = date(2023, 1, 2)
diff --git a/data_collection/gazette/spiders/ce/ce_pereiro.py b/data_collection/gazette/spiders/ce/ce_pereiro.py
new file mode 100644
index 000000000..c7e3c7049
--- /dev/null
+++ b/data_collection/gazette/spiders/ce/ce_pereiro.py
@@ -0,0 +1,11 @@
+from datetime import date
+
+from gazette.spiders.base.adiarios_v1 import BaseAdiariosV1Spider
+
+
+class CePereiroSpider(BaseAdiariosV1Spider):
+    TERRITORY_ID = "2310803"
+    name = "ce_pereiro"
+    allowed_domains = ["pereiro.ce.gov.br"]
+    BASE_URL = "https://www.pereiro.ce.gov.br"
+    start_date = date(2020, 1, 3)
diff --git a/data_collection/gazette/spiders/ce/ce_sao_benedito.py b/data_collection/gazette/spiders/ce/ce_sao_benedito.py
new file mode 100644
index 000000000..7093e7d26
--- /dev/null
+++ b/data_collection/gazette/spiders/ce/ce_sao_benedito.py
@@ -0,0 +1,11 @@
+from datetime import date
+
+from gazette.spiders.base.adiarios_v1 import BaseAdiariosV1Spider
+
+
+class CeSaoBeneditoSpider(BaseAdiariosV1Spider):
+    TERRITORY_ID = "2312304"
+    name = "ce_sao_benedito"
+    allowed_domains = ["saobenedito.ce.gov.br"]
+    BASE_URL = "https://www.saobenedito.ce.gov.br"
+    start_date = date(2018, 2, 15)
diff --git a/data_collection/gazette/spiders/ce/ce_taua.py b/data_collection/gazette/spiders/ce/ce_taua.py
new file mode 100644
index 000000000..1e86dfd2e
--- /dev/null
+++ b/data_collection/gazette/spiders/ce/ce_taua.py
@@ -0,0 +1,11 @@
+from datetime import date
+
+from gazette.spiders.base.adiarios_v1 import BaseAdiariosV1Spider
+
+
+class CeTauaSpider(BaseAdiariosV1Spider):
+    TERRITORY_ID = "2313302"
+    name = "ce_taua"
+    allowed_domains = ["taua.ce.gov.br"]
+    BASE_URL = "https://www.taua.ce.gov.br"
+    start_date = date(2019, 8, 30)
diff --git a/data_collection/gazette/spiders/ce/ce_tiangua.py b/data_collection/gazette/spiders/ce/ce_tiangua.py
new file mode 100644
index 000000000..0b9df9aa7
--- /dev/null
+++ b/data_collection/gazette/spiders/ce/ce_tiangua.py
@@ -0,0 +1,11 @@
+from datetime import date
+
+from gazette.spiders.base.adiarios_v1 import BaseAdiariosV1Spider
+
+
+class CeTianguaSpider(BaseAdiariosV1Spider):
+    TERRITORY_ID = "2313401"
+    name = "ce_tiangua"
+    allowed_domains = ["tiangua.ce.gov.br"]
+    BASE_URL = "https://www.tiangua.ce.gov.br"
+    start_date = date(2021, 11, 3)
diff --git a/data_collection/gazette/spiders/ce/ce_uruoca.py b/data_collection/gazette/spiders/ce/ce_uruoca.py
new file mode 100644
index 000000000..7768586a6
--- /dev/null
+++ b/data_collection/gazette/spiders/ce/ce_uruoca.py
@@ -0,0 +1,11 @@
+from datetime import date
+
+from gazette.spiders.base.adiarios_v1 import BaseAdiariosV1Spider
+
+
+class CeUruocaSpider(BaseAdiariosV1Spider):
+    TERRITORY_ID = "2313906"
+    name = "ce_uruoca"
+    allowed_domains = ["uruoca.ce.gov.br"]
+    BASE_URL = "https://www.uruoca.ce.gov.br"
+    start_date = date(2017, 1, 2)