Skip to content

Commit

Permalink
[UK] Update for new register website.
Browse files Browse the repository at this point in the history
  • Loading branch information
dracos authored and TheyWorkForYou Live CVS User committed Sep 5, 2020
1 parent a130c50 commit 9b900c5
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions pyscraper/regmem/pullgluepages.py
Original file line number Diff line number Diff line change
Expand Up @@ -163,13 +163,13 @@ def FindRegmemPages():
'/pa/cm/cmregmem/925/part1contents.htm': '2013-01-18',
}
urls = []
- idxurl = 'http://www.publications.parliament.uk/pa/cm/cmregmem.htm'
+ idxurl = 'https://www.parliament.uk/mps-lords-and-offices/standards-and-financial-interests/parliamentary-commissioner-for-standards/registers-of-interests/register-of-members-financial-interests/'
ur = urllib.urlopen(idxurl)
content = ur.read()
ur.close()

soup = BeautifulSoup.BeautifulSoup(content)
- soup = soup.find(id='content').find('ul')
+ soup = soup.find(attrs='main-body').find('ul')
ixurls = [urlparse.urljoin(idxurl, ix['href']) for ix in soup.findAll('a', href=True)]

for ixurl in ixurls:
Expand Down

0 comments on commit 9b900c5

Please sign in to comment.