Skip to content

Commit 9b900c5

Browse files
dracos authored and TheyWorkForYou Live CVS User committed
[UK] Update for new register website.
1 parent a130c50 commit 9b900c5

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

pyscraper/regmem/pullgluepages.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -163,13 +163,13 @@ def FindRegmemPages():
163163
'/pa/cm/cmregmem/925/part1contents.htm': '2013-01-18',
164164
}
165165
urls = []
166-
idxurl = 'http://www.publications.parliament.uk/pa/cm/cmregmem.htm'
166+
idxurl = 'https://www.parliament.uk/mps-lords-and-offices/standards-and-financial-interests/parliamentary-commissioner-for-standards/registers-of-interests/register-of-members-financial-interests/'
167167
ur = urllib.urlopen(idxurl)
168168
content = ur.read()
169169
ur.close()
170170

171171
soup = BeautifulSoup.BeautifulSoup(content)
172-
soup = soup.find(id='content').find('ul')
172+
soup = soup.find(attrs='main-body').find('ul')
173173
ixurls = [urlparse.urljoin(idxurl, ix['href']) for ix in soup.findAll('a', href=True)]
174174

175175
for ixurl in ixurls:

0 commit comments

Comments
 (0)