File tree 1 file changed +14
-1
lines changed
1 file changed +14
-1
lines changed Original file line number Diff line number Diff line change 4
4
import feedparser
5
5
6
6
import lxml .html
7
+ from scrapelib import HTTPError
7
8
from openstates .scrape import Scraper , VoteEvent
8
9
9
10
@@ -34,7 +35,19 @@ def scrape_bill_list(self, session):
34
35
yield from self .scrape_vote_from_bill (session , bill_id , item .guid )
35
36
36
37
def scrape_vote_from_bill (self , session , bill , url ):
37
- doc = lxml .html .fromstring (self .get (url , retry_on_404 = True ).text )
38
+ try :
39
+ vote_response = self .get (url , retry_on_404 = True )
40
+ except HTTPError as e :
41
+ # 500 error on HCR 5011 for some reason
42
+ # temporarily swallow this exception to allow scrape to finish
43
+ if bill == "HCR 5011" :
44
+ self .logger .warning (
45
+ f"Swallowing HTTPError for { bill } as a temporary fix: { e } "
46
+ )
47
+ return
48
+ else :
49
+ raise e
50
+ doc = lxml .html .fromstring (vote_response .text )
38
51
doc .make_links_absolute (url )
39
52
all_links = doc .xpath (
40
53
"//table[@class='bottom']/tbody[@class='tab-content-sub']/tr/td/a/@href"
You can’t perform that action at this time.
0 commit comments