Skip to content

Commit bdb2f35

Browse files
KS: votes: fix same outlier 500 on bill HCR 5011
1 parent e0de4e2 commit bdb2f35

File tree

1 file changed

+14
-1
lines changed

1 file changed

+14
-1
lines changed

scrapers/ks/votes.py

+14 -1
Original file line number | Diff line number | Diff line change
@@ -4,6 +4,7 @@
44
import feedparser
55

66
import lxml.html
7+
from scrapelib import HTTPError
78
from openstates.scrape import Scraper, VoteEvent
89

910

@@ -34,7 +35,19 @@ def scrape_bill_list(self, session):
3435
yield from self.scrape_vote_from_bill(session, bill_id, item.guid)
3536

3637
def scrape_vote_from_bill(self, session, bill, url):
37-
doc = lxml.html.fromstring(self.get(url, retry_on_404=True).text)
38+
try:
39+
vote_response = self.get(url, retry_on_404=True)
40+
except HTTPError as e:
41+
# 500 error on HCR 5011 for some reason
42+
# temporarily swallow this exception to allow scrape to finish
43+
if bill == "HCR 5011":
44+
self.logger.warning(
45+
f"Swallowing HTTPError for {bill} as a temporary fix: {e}"
46+
)
47+
return
48+
else:
49+
raise e
50+
doc = lxml.html.fromstring(vote_response.text)
3851
doc.make_links_absolute(url)
3952
all_links = doc.xpath(
4053
"//table[@class='bottom']/tbody[@class='tab-content-sub']/tr/td/a/@href"

0 commit comments

Comments
 (0)