From f3ea32d75536a6a0ec1230a1d8fc36dd08b020f8 Mon Sep 17 00:00:00 2001 From: Matthew Somerville Date: Mon, 22 Apr 2024 17:23:09 +0100 Subject: [PATCH] fixup! Add scraper for new Scottish Parliament site --- pyscraper/sp_2024/parse.py | 8 +------- 1 file changed, 1 insertion(+), 7 deletions(-) diff --git a/pyscraper/sp_2024/parse.py b/pyscraper/sp_2024/parse.py index eba26735..883f2e36 100644 --- a/pyscraper/sp_2024/parse.py +++ b/pyscraper/sp_2024/parse.py @@ -160,13 +160,7 @@ def process_raw_html(html: str, agenda_item_url: str): vote_div = soup.new_tag("msplist") vote_div["vote"] = vote_str # get all the speakers in the next sibling - members = ( - str(vote_tag.find_next_sibling("p")) - .replace("

", "") - .replace("

", "") - .split("
") - ) - members = [x.strip() for x in members] + members = vote_tag.find_next_sibling("p").stripped_strings for m in members: mspname = soup.new_tag("mspname")