diff --git a/members/wikipedia-mla.xml b/members/wikipedia-mla.xml index 22063eb7..401895db 100644 --- a/members/wikipedia-mla.xml +++ b/members/wikipedia-mla.xml @@ -112,7 +112,7 @@ - + @@ -124,7 +124,7 @@ - + @@ -139,7 +139,7 @@ - + @@ -168,8 +168,8 @@ - - + + @@ -242,7 +242,7 @@ - + @@ -284,4 +284,5 @@ + diff --git a/pyscraper/ni/wikipedia-mla.py b/pyscraper/ni/wikipedia-mla.py index 95780084..cbb092e0 100755 --- a/pyscraper/ni/wikipedia-mla.py +++ b/pyscraper/ni/wikipedia-mla.py @@ -36,7 +36,7 @@ def read(y): matches.update(re.findall(matcher, content)) # 4-6th Assembly changes -changes = re.findall('(?s)

]*>MLAs by constituency.*?

]*>Changes(.*?)', content) +changes = re.findall('(?s)]*>(?:]*>)?MLAs by constituency.*?]*>(?:]*>)?Changes(.*?)', content) for change in changes: for m in re.findall('''(?x)