From 5fcec33d799471efa4f58c8778eaf1c1137fb5e3 Mon Sep 17 00:00:00 2001 From: TaTi Lattanzi Date: Thu, 26 Oct 2023 15:52:44 -0300 Subject: [PATCH 1/5] =?UTF-8?q?add=20Arape=C3=AD=20(SP)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- data_collection/gazette/spiders/sp/sp_arapei.py | 11 +++++++++++ scripts/enabled_spiders.py | 1 + 2 files changed, 12 insertions(+) create mode 100644 data_collection/gazette/spiders/sp/sp_arapei.py diff --git a/data_collection/gazette/spiders/sp/sp_arapei.py b/data_collection/gazette/spiders/sp/sp_arapei.py new file mode 100644 index 000000000..73a63bf05 --- /dev/null +++ b/data_collection/gazette/spiders/sp/sp_arapei.py @@ -0,0 +1,11 @@ +from datetime import date + +from gazette.spiders.base.instar import BaseInstarSpider + + +class SpArapeiSpider(BaseInstarSpider): + TERRITORY_ID = "3503158" + name = "sp_arapei" + allowed_domains = ["arapei.sp.gov.br"] + base_url = "https://www.arapei.sp.gov.br/portal/diario-oficial" + start_date = date(2021, 5, 27) diff --git a/scripts/enabled_spiders.py b/scripts/enabled_spiders.py index 7c0436cf9..55af467e2 100644 --- a/scripts/enabled_spiders.py +++ b/scripts/enabled_spiders.py @@ -130,6 +130,7 @@ "sp_aparecida", "sp_aracariguama", "sp_aracatuba", + "sp_arapei", "sp_avare", "sp_barao_de_antonina", "sp_birigui", From ecf67b9f3cf2cd2b0e0e3e6c06dedc38efc9f631 Mon Sep 17 00:00:00 2001 From: TaTi Lattanzi Date: Thu, 26 Oct 2023 15:57:52 -0300 Subject: [PATCH 2/5] =?UTF-8?q?add=20Turi=C3=BAba=20(SP)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- data_collection/gazette/spiders/sp/sp_turiuba.py | 11 +++++++++++ scripts/enabled_spiders.py | 1 + 2 files changed, 12 insertions(+) create mode 100644 data_collection/gazette/spiders/sp/sp_turiuba.py diff --git a/data_collection/gazette/spiders/sp/sp_turiuba.py b/data_collection/gazette/spiders/sp/sp_turiuba.py new file mode 100644 index 000000000..2766ea227 --- 
/dev/null +++ b/data_collection/gazette/spiders/sp/sp_turiuba.py @@ -0,0 +1,11 @@ +from datetime import date + +from gazette.spiders.base.instar import BaseInstarSpider + + +class SpTuriubaSpider(BaseInstarSpider): + TERRITORY_ID = "3555208" + name = "sp_turiuba" + allowed_domains = ["turiuba.sp.gov.br"] + base_url = "https://www.turiuba.sp.gov.br/portal/diario-oficial" + start_date = date(2020, 6, 19) diff --git a/scripts/enabled_spiders.py b/scripts/enabled_spiders.py index 55af467e2..a735e8c06 100644 --- a/scripts/enabled_spiders.py +++ b/scripts/enabled_spiders.py @@ -193,6 +193,7 @@ "sp_sertaozinho", "sp_sumare", "sp_taquaral", + "sp_turiuba", "sp_valinhos", "sp_valparaiso", "sp_vera_cruz", From 4068c8566e50b61a6549537fa863149c9026da4b Mon Sep 17 00:00:00 2001 From: TaTi Lattanzi Date: Thu, 26 Oct 2023 15:59:38 -0300 Subject: [PATCH 3/5] add Dirce Reis (SP) --- data_collection/gazette/spiders/sp/sp_dirce_reis.py | 11 +++++++++++ scripts/enabled_spiders.py | 1 + 2 files changed, 12 insertions(+) create mode 100644 data_collection/gazette/spiders/sp/sp_dirce_reis.py diff --git a/data_collection/gazette/spiders/sp/sp_dirce_reis.py b/data_collection/gazette/spiders/sp/sp_dirce_reis.py new file mode 100644 index 000000000..a3e9f5918 --- /dev/null +++ b/data_collection/gazette/spiders/sp/sp_dirce_reis.py @@ -0,0 +1,11 @@ +from datetime import date + +from gazette.spiders.base.instar import BaseInstarSpider + + +class SpDirceReisSpider(BaseInstarSpider): + TERRITORY_ID = "3513850" + name = "sp_dirce_reis" + allowed_domains = ["dircereis.sp.gov.br"] + base_url = "https://www.dircereis.sp.gov.br/portal/diario-oficial" + start_date = date(2019, 10, 7) diff --git a/scripts/enabled_spiders.py b/scripts/enabled_spiders.py index a735e8c06..81f7c33bc 100644 --- a/scripts/enabled_spiders.py +++ b/scripts/enabled_spiders.py @@ -141,6 +141,7 @@ "sp_campo_limpo_paulista", "sp_catanduva", "sp_coronel_macedo", + "sp_dirce_reis", "sp_dracena", "sp_floreal", "sp_glicerio", From 
0e60d561d34f5828f7111682de4046e6c5b6ac69 Mon Sep 17 00:00:00 2001 From: TaTi Lattanzi Date: Thu, 26 Oct 2023 16:01:36 -0300 Subject: [PATCH 4/5] =?UTF-8?q?add=20Uni=C3=A3o=20Paulista=20(SP)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .../gazette/spiders/sp/sp_uniao_paulista.py | 11 +++++++++++ scripts/enabled_spiders.py | 1 + 2 files changed, 12 insertions(+) create mode 100644 data_collection/gazette/spiders/sp/sp_uniao_paulista.py diff --git a/data_collection/gazette/spiders/sp/sp_uniao_paulista.py b/data_collection/gazette/spiders/sp/sp_uniao_paulista.py new file mode 100644 index 000000000..37cd0ed85 --- /dev/null +++ b/data_collection/gazette/spiders/sp/sp_uniao_paulista.py @@ -0,0 +1,11 @@ +from datetime import date + +from gazette.spiders.base.instar import BaseInstarSpider + + +class SpUniaoPaulistaSpider(BaseInstarSpider): + TERRITORY_ID = "3555703" + name = "sp_uniao_paulista" + allowed_domains = ["uniaopaulista.sp.gov.br"] + base_url = "https://www.uniaopaulista.sp.gov.br/portal/diario-oficial" + start_date = date(2023, 1, 11) diff --git a/scripts/enabled_spiders.py b/scripts/enabled_spiders.py index 81f7c33bc..54b8afb1e 100644 --- a/scripts/enabled_spiders.py +++ b/scripts/enabled_spiders.py @@ -195,6 +195,7 @@ "sp_sumare", "sp_taquaral", "sp_turiuba", + "sp_uniao_paulista", "sp_valinhos", "sp_valparaiso", "sp_vera_cruz", From d34fa2ca909c8c332409ac13baa18dbf54d08d9d Mon Sep 17 00:00:00 2001 From: TaTi Lattanzi Date: Thu, 26 Oct 2023 16:03:04 -0300 Subject: [PATCH 5/5] add Nova Castilho (SP) --- .../gazette/spiders/sp/sp_nova_castilho.py | 11 +++++++++++ scripts/enabled_spiders.py | 1 + 2 files changed, 12 insertions(+) create mode 100644 data_collection/gazette/spiders/sp/sp_nova_castilho.py diff --git a/data_collection/gazette/spiders/sp/sp_nova_castilho.py b/data_collection/gazette/spiders/sp/sp_nova_castilho.py new file mode 100644 index 000000000..ac41c8d13 --- /dev/null +++ 
b/data_collection/gazette/spiders/sp/sp_nova_castilho.py @@ -0,0 +1,11 @@ +from datetime import date + +from gazette.spiders.base.instar import BaseInstarSpider + + +class SpNovaCastilhoSpider(BaseInstarSpider): + TERRITORY_ID = "3532868" + name = "sp_nova_castilho" + allowed_domains = ["novacastilho.sp.gov.br"] + base_url = "https://www.novacastilho.sp.gov.br/portal/diario-oficial" + start_date = date(2021, 1, 29) diff --git a/scripts/enabled_spiders.py b/scripts/enabled_spiders.py index 54b8afb1e..69b065137 100644 --- a/scripts/enabled_spiders.py +++ b/scripts/enabled_spiders.py @@ -167,6 +167,7 @@ "sp_mogi_guacu", "sp_monte_mor", + "sp_nova_castilho", "sp_nova_luzitania", "sp_osasco", "sp_ourinhos", "sp_parisi",