From a4b5ecfd28b1657d288676e025c1b1641fa94d9b Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Cruz=20N=C3=BA=C3=B1ez?= Date: Thu, 19 Sep 2024 11:59:53 -0400 Subject: [PATCH] improve docstring and simplify parsing of source --- city_scrapers/spiders/losca_Board_of_Supervisors.py | 13 ++----------- 1 file changed, 2 insertions(+), 11 deletions(-) diff --git a/city_scrapers/spiders/losca_Board_of_Supervisors.py b/city_scrapers/spiders/losca_Board_of_Supervisors.py index 9feed3d..b6625f7 100644 --- a/city_scrapers/spiders/losca_Board_of_Supervisors.py +++ b/city_scrapers/spiders/losca_Board_of_Supervisors.py @@ -11,12 +11,7 @@ class LoscaBoardOfSupervisorsSpider(CityScrapersSpider): start_urls = ["https://bos.lacounty.gov/board-meeting-agendas/"] def parse(self, response): - """ - `parse` should always `yield` Meeting items. - - Change the `_parse_title`, `_parse_start`, etc methods to fit your scraping - needs. - """ + """Parse meeting items from agency website.""" location = { "name": "Kenneth Hahn Hall of Administration", "address": "500 West Temple Street, Room 381B, Los Angeles", @@ -36,7 +31,7 @@ def parse(self, response): time_notes="", location=location, links=self._parse_links(item), - source=self._parse_source(response), + source=response.url, ) meeting["status"] = self._get_status(meeting) @@ -74,7 +69,3 @@ def _parse_links(self, item): href = link.css("::attr(href)").get() out.append({"title": title, "href": href}) return out - - def _parse_source(self, response): - """Parse or generate source.""" - return response.url