C
|
ca
|
2024-04-23 04:40:58
|
2024-04-23 04:40:58
|
|
C
|
ca_ab
|
2024-04-23 04:17:55
|
2024-04-23 04:17:55
|
|
D>
04:25:27 WARNING scrapelib: got ('Connection aborted.', ConnectionResetError(104, 'Connection reset by peer')) sleeping for 10 seconds before retry
04:25:38 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:4806016/legislature yet
|
ca_ab_calgary
|
|
2024-04-23 04:25:38
|
AssertionError: No councillors found
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_ab_calgary/people.py", line 15, in scrape
assert len(councillors), "No councillors found"
AssertionError: No councillors found
|
D>
04:44:57 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/province:ab/executive yet
|
ca_ab_candidates
|
|
2024-04-23 04:44:57
|
pupa.exceptions.UnresolvedIdError: cannot resolve pseudo id to Post: ~{"label": "Edmonton-Mill Woods", "organization__classi…
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 307, in do_handle
report['import'] = self.do_import(juris, args)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 211, in do_import
report.update(membership_importer.import_directory(datadir))
File "/app/.heroku/src/pupa/pupa/importers/base.py", line 190, in import_directory
return self.import_data(json_stream())
File "/app/.heroku/src/pupa/pupa/importers/base.py", line 227, in import_data
obj_id, what = self.import_item(data)
File "/app/.heroku/src/pupa/pupa/importers/base.py", line 247, in import_item
data = self.prepare_for_db(data)
File "/app/.heroku/src/pupa/pupa/importers/memberships.py", line 50, in prepare_for_db
data['post_id'] = self.post_importer.resolve_json_id(data['post_id'])
File "/app/.heroku/src/pupa/pupa/importers/base.py", line 165, in resolve_json_id
raise UnresolvedIdError(errmsg)
pupa.exceptions.UnresolvedIdError: cannot resolve pseudo id to Post: ~{"label": "Edmonton-Mill Woods", "organization__classification": "executive", "role": "MLA"}
|
D>
04:13:21 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:4811061/legislature yet
|
ca_ab_edmonton
|
|
2024-04-23 04:13:21
|
AssertionError: No councillors found
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_ab_edmonton/people.py", line 14, in scrape
assert len(councillors), "No councillors found"
AssertionError: No councillors found
|
D>
04:13:23 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:4819012/legislature yet
|
ca_ab_grande_prairie
|
|
2024-04-23 04:13:23
|
KeyError: 'name'
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/utils.py", line 394, in scrape
if not self.is_valid_row(row):
File "/app/scrapers/utils.py", line 348, in is_valid_row
return row["name"] not in empty
KeyError: 'name'
|
C
|
ca_ab_grande_prairie_county_no_1
|
2024-04-23 04:04:41
|
2024-04-23 04:04:41
|
|
D>
04:20:27 WARNING scrapelib: sleeping for 10 seconds before retry
04:20:37 WARNING scrapelib: sleeping for 20 seconds before retry
04:20:57 WARNING scrapelib: sleeping for 40 seconds before retry
|
ca_ab_lethbridge
|
2022-12-08 04:08:13
|
2024-04-23 04:21:37
|
scrapelib.HTTPError: 410 while retrieving https://docs.google.com/spreadsheets/d/1OnHJq_j-r3R4MMkRQ5ahNkApuDp1NpTYn4UVTTNGY5…
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/utils.py", line 379, in scrape
reader = self.csv_reader(
File "/app/scrapers/utils.py", line 227, in csv_reader
response = self.get(url, **kwargs)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 410 while retrieving https://docs.google.com/spreadsheets/d/1OnHJq_j-r3R4MMkRQ5ahNkApuDp1NpTYn4UVTTNGY5c/pub?gid=908195318&single=true&output=csv
|
D>
|
ca_ab_strathcona_county
|
2023-12-01 04:03:03
|
2024-04-23 04:15:50
|
KeyError: 'name'
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/utils.py", line 394, in scrape
if not self.is_valid_row(row):
File "/app/scrapers/utils.py", line 348, in is_valid_row
return row["name"] not in empty
KeyError: 'name'
|
D>
04:19:51 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:4816037/legislature yet
|
ca_ab_wood_buffalo
|
|
2024-04-23 04:19:51
|
IndexError: list index out of range
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_ab_wood_buffalo/people.py", line 15, in scrape
mayor_url = page.xpath('//li[@id="pageid1075"]/div/a/@href')[0]
IndexError: list index out of range
|
D>
|
ca_bc
|
2024-04-23 04:19:39
|
2024-04-23 05:32:54
|
SystemExit: 1
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_bc/people.py", line 27, in scrape
page = self.lxmlize(url)
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 579, in request
resp = super().request(
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 404, in request
resp = super().request(
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 232, in request
return super().request(
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 122, in request
resp = super().request(
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 589, in request
resp = self.send(prep, **send_kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 703, in send
r = adapter.send(request, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/adapters.py", line 486, in send
resp = conn.urlopen(
File "/app/.heroku/python/lib/python3.8/site-packages/urllib3/connectionpool.py", line 715, in urlopen
httplib_response = self._make_request(
File "/app/.heroku/python/lib/python3.8/site-packages/urllib3/connectionpool.py", line 467, in _make_request
six.raise_from(e, None)
File "<string>", line 3, in raise_from
File "/app/.heroku/python/lib/python3.8/site-packages/urllib3/connectionpool.py", line 462, in _make_request
httplib_response = conn.getresponse()
File "/app/.heroku/python/lib/python3.8/http/client.py", line 1348, in getresponse
response.begin()
File "/app/.heroku/python/lib/python3.8/http/client.py", line 316, in begin
version, status, reason = self._read_status()
File "/app/.heroku/python/lib/python3.8/http/client.py", line 277, in _read_status
line = str(self.fp.readline(_MAXLINE + 1), "iso-8859-1")
File "/app/.heroku/python/lib/python3.8/socket.py", line 669, in readinto
return self._sock.recv_into(b)
File "/app/.heroku/python/lib/python3.8/ssl.py", line 1274, in recv_into
return self.read(nbytes, buffer)
File "/app/.heroku/python/lib/python3.8/ssl.py", line 1132, in read
return self._sslobj.read(len, buffer)
File "/app/.heroku/python/lib/python3.8/site-packages/gunicorn/workers/base.py", line 196, in handle_abort
sys.exit(1)
SystemExit: 1
|
D>
04:04:44 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:5909052/legislature yet
|
ca_bc_abbotsford
|
|
2024-04-23 04:04:44
|
AssertionError: No councillors found
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_bc_abbotsford/people.py", line 19, in scrape
assert len(councillors), "No councillors found"
AssertionError: No councillors found
|
D>
04:44:48 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:5915025/legislature yet
|
ca_bc_burnaby
|
|
2024-04-23 04:44:48
|
AssertionError: No councillors found
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_bc_burnaby/people.py", line 13, in scrape
assert len(councillors), "No councillors found"
AssertionError: No councillors found
|
D>
04:03:22 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:5915034/legislature yet
|
ca_bc_coquitlam
|
|
2024-04-23 04:03:22
|
scrapelib.HTTPError: 404 while retrieving https://www.coquitlam.ca/city-hall/mayor-and-council/mayor-and-council.aspx
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_bc_coquitlam/people.py", line 11, in scrape
page = self.lxmlize(COUNCIL_PAGE)
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://www.coquitlam.ca/city-hall/mayor-and-council/mayor-and-council.aspx
|
C
|
ca_bc_kelowna
|
2024-04-23 04:13:24
|
2024-04-23 04:13:24
|
|
D>
|
ca_bc_langley
|
2022-10-18 04:01:08
|
2024-04-23 04:04:42
|
scrapelib.HTTPError: 404 while retrieving https://opendata.arcgis.com/datasets/daa3ea0f01d24e9b80d837cf2178eb71_0.csv
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/utils.py", line 379, in scrape
reader = self.csv_reader(
File "/app/scrapers/utils.py", line 227, in csv_reader
response = self.get(url, **kwargs)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://opendata.arcgis.com/datasets/daa3ea0f01d24e9b80d837cf2178eb71_0.csv
|
D>
04:01:43 WARNING scrapelib: sleeping for 10 seconds before retry
04:01:53 WARNING scrapelib: sleeping for 20 seconds before retry
04:02:13 WARNING scrapelib: sleeping for 40 seconds before retry
04:02:54 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/province:bc/government yet
|
ca_bc_municipalities
|
|
2024-04-23 04:02:54
|
scrapelib.HTTPError: 403 while retrieving https://www.civicinfo.bc.ca/people
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_bc_municipalities/people.py", line 67, in scrape
list_page = self.lxmlize(LIST_PAGE)
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 403 while retrieving https://www.civicinfo.bc.ca/people
|
C
|
ca_bc_municipalities_candidates
|
2024-04-23 04:27:23
|
2024-04-23 04:27:24
|
|
D>
04:43:29 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:5915029/legislature yet
|
ca_bc_new_westminster
|
|
2024-04-23 04:43:29
|
scrapelib.HTTPError: 404 while retrieving https://opendata.newwestcity.ca/downloads/councillor-contact-information/councillo…
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/utils.py", line 379, in scrape
reader = self.csv_reader(
File "/app/scrapers/utils.py", line 227, in csv_reader
response = self.get(url, **kwargs)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://opendata.newwestcity.ca/downloads/councillor-contact-information/councillor_contacts.csv
|
D>
|
ca_bc_richmond
|
2023-04-29 04:03:23
|
2024-04-23 04:15:59
|
scrapelib.HTTPError: 404 while retrieving https://www.richmond.ca/contact/departments/council.htm
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_bc_richmond/people.py", line 12, in scrape
contact_page = self.lxmlize(CONTACT_URL)
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://www.richmond.ca/contact/departments/council.htm
|
C
|
ca_bc_saanich
|
2024-04-23 04:16:08
|
2024-04-23 04:16:08
|
|
D>
04:20:26 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:5915004/legislature yet
|
ca_bc_surrey
|
|
2024-04-23 04:20:26
|
AssertionError: No members found
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_bc_surrey/people.py", line 14, in scrape
assert len(members), "No members found"
AssertionError: No members found
|
C
|
ca_bc_vancouver
|
2024-04-23 04:05:53
|
2024-04-23 04:05:53
|
|
D>
04:28:09 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:5917034/legislature yet
|
ca_bc_victoria
|
|
2024-04-23 04:28:09
|
KeyError: 'primary role'
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/utils.py", line 413, in scrape
role = row["primary role"]
KeyError: 'primary role'
|
C
|
ca_candidates
|
2024-04-23 04:00:49
|
2024-04-23 04:00:49
|
|
C
|
ca_mb
|
2024-04-23 04:05:45
|
2024-04-23 04:05:45
|
|
D>
04:19:55 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/province:mb/executive yet
|
ca_mb_candidates
|
|
2024-04-23 04:19:55
|
obj2 sources: []
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 307, in do_handle
report['import'] = self.do_import(juris, args)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 211, in do_import
report.update(membership_importer.import_directory(datadir))
File "/app/.heroku/src/pupa/pupa/importers/base.py", line 190, in import_directory
return self.import_data(json_stream())
File "/app/.heroku/src/pupa/pupa/importers/base.py", line 227, in import_data
obj_id, what = self.import_item(data)
File "/app/.heroku/src/pupa/pupa/importers/base.py", line 265, in import_item
raise DuplicateItemError(data, obj, related.get('sources', []))
pupa.exceptions.DuplicateItemError: attempt to import data that would conflict with data already in the import: {'label': '', 'role': 'member', 'person_id': 'ocd-person/84f48bcf-ed46-4748-bac8-b8680d3030bc', 'person_name': 'James Beddome', 'organization_id': 'ocd-organization/4343d444-c836-499a-b6ba-8c435656752b', 'post_id': None, 'on_behalf_of_id': None, 'start_date': '', 'end_date': '', 'extras': {}} (already imported as James Beddome in Green Party (member))
obj1 sources: []
obj2 sources: []
|
D>
|
ca_mb_winnipeg
|
2022-10-25 04:10:28
|
2024-04-23 04:20:02
|
AssertionError: No councillors found
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_mb_winnipeg/people.py", line 22, in scrape
assert len(councillors), "No councillors found"
AssertionError: No councillors found
|
D>
04:05:51 WARNING pupa: validation of Membership c64a9816-0126-11ef-9f20-6a82ce95162d failed: 1 validation errors:
Value 'town hall.weedon@hsfqc.ca' for field '' does not match regular expression '\A([A-Za-z0-9._\'-]+)@(?:[A-Za-z0-9-]+\.)+[A-Za-z]{2,}\Z'
|
ca_municipalities
|
|
2024-04-23 04:05:51
|
Value 'town hall.weedon@hsfqc.ca' for field '' does not match regular expression '\A([A-Za-z0-9._\'-]+)@(?:[A-Za-z0-9-]+\.)+…
Traceback (most recent call last):
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 175, in validate
validator.validate(self.as_dict(), schema)
File "/app/.heroku/python/lib/python3.8/site-packages/validictory/validator.py", line 620, in validate
raise MultipleValidationError(self._errors)
validictory.validator.MultipleValidationError: 1 validation errors:
Value 'town hall.weedon@hsfqc.ca' for field '' does not match regular expression '\A([A-Za-z0-9._\'-]+)@(?:[A-Za-z0-9-]+\.)+[A-Za-z]{2,}\Z'
During handling of the above exception, another exception occurred:
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 104, in do_scrape
self.save_object(obj)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 93, in save_object
self.save_object(obj)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 89, in save_object
raise ve
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 85, in save_object
obj.validate()
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 177, in validate
raise ScrapeValueError('validation of {} {} failed: {}'.format(
pupa.exceptions.ScrapeValueError: validation of Membership c64a9816-0126-11ef-9f20-6a82ce95162d failed: 1 validation errors:
Value 'town hall.weedon@hsfqc.ca' for field '' does not match regular expression '\A([A-Za-z0-9._\'-]+)@(?:[A-Za-z0-9-]+\.)+[A-Za-z]{2,}\Z'
|
C
|
ca_nb
|
2024-04-23 04:01:41
|
2024-04-23 04:01:41
|
|
D>
|
ca_nb_fredericton
|
2023-06-18 22:29:30
|
2024-04-23 04:00:31
|
scrapelib.HTTPError: 404 while retrieving https://www.fredericton.ca/en/city-hall/city-council-committees/mayor-council
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_nb_fredericton/people.py", line 9, in scrape
page = self.lxmlize(COUNCIL_PAGE)
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://www.fredericton.ca/en/city-hall/city-council-committees/mayor-council
|
D>
04:15:57 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:1307022/legislature yet
|
ca_nb_moncton
|
|
2024-04-23 04:15:57
|
scrapelib.HTTPError: 404 while retrieving https://opendata.arcgis.com/datasets/d81d30cf2b0d4bf7ae7aea5b0acc9d5f_0.csv
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/utils.py", line 379, in scrape
reader = self.csv_reader(
File "/app/scrapers/utils.py", line 227, in csv_reader
response = self.get(url, **kwargs)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://opendata.arcgis.com/datasets/d81d30cf2b0d4bf7ae7aea5b0acc9d5f_0.csv
|
D>
04:20:03 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/province:nb/government yet
|
ca_nb_municipalities
|
|
2024-04-23 04:20:03
|
AssertionError: No list items found
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_nb_municipalities/people.py", line 65, in scrape
assert len(list_links), "No list items found"
AssertionError: No list items found
|
C
|
ca_nb_saint_john
|
2024-04-23 04:20:23
|
2024-04-23 04:20:23
|
|
C
|
ca_nl
|
2024-04-23 04:15:47
|
2024-04-23 04:15:47
|
|
D>
|
ca_nl_st_john_s
|
2022-10-26 04:07:32
|
2024-04-23 04:26:56
|
AssertionError: No councillors found
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_nl_st_john_s/people.py", line 15, in scrape
assert len(councillors), "No councillors found"
AssertionError: No councillors found
|
C
|
ca_ns
|
2024-04-23 04:06:50
|
2024-04-23 04:06:50
|
|
D>
04:23:03 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:1217030/legislature yet
|
ca_ns_cape_breton
|
|
2024-04-23 04:23:03
|
pupa.exceptions.SameNameError: multiple people with same name "Lorne Green" in Jurisdiction - must provide birth_date to dis…
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 307, in do_handle
report['import'] = self.do_import(juris, args)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 207, in do_import
report.update(person_importer.import_directory(datadir))
File "/app/.heroku/src/pupa/pupa/importers/base.py", line 190, in import_directory
return self.import_data(json_stream())
File "/app/.heroku/src/pupa/pupa/importers/base.py", line 226, in import_data
for json_id, data in self._prepare_imports(data_items):
File "/app/.heroku/src/pupa/pupa/importers/people.py", line 33, in _prepare_imports
raise SameNameError(name)
pupa.exceptions.SameNameError: multiple people with same name "Lorne Green" in Jurisdiction - must provide birth_date to disambiguate
|
D>
04:03:28 WARNING scrapelib: sleeping for 10 seconds before retry
04:03:38 WARNING scrapelib: sleeping for 20 seconds before retry
04:03:58 WARNING scrapelib: sleeping for 40 seconds before retry
04:04:39 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:1209034/legislature yet
|
ca_ns_halifax
|
|
2024-04-23 04:04:39
|
scrapelib.HTTPError: 403 while retrieving https://www.halifax.ca/city-hall/districts-councillors
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_ns_halifax/people.py", line 14, in scrape
page = self.lxmlize(COUNCIL_PAGE)
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 403 while retrieving https://www.halifax.ca/city-hall/districts-councillors
|
C
|
ca_on
|
2024-04-23 04:15:41
|
2024-04-23 04:15:41
|
|
D>
04:13:26 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:3518005/legislature yet
|
ca_on_ajax
|
|
2024-04-23 04:13:26
|
IndexError: list index out of range
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_on_ajax/people.py", line 27, in scrape
voice = councillor.xpath('.//p[contains(.,"Cel")]/text()')[1]
IndexError: list index out of range
|
D>
04:15:48 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:3512005/legislature yet
|
ca_on_belleville
|
|
2024-04-23 04:15:48
|
scrapelib.HTTPError: 404 while retrieving https://www.belleville.ca/city-hall/page/city-council
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_on_belleville/people.py", line 14, in scrape
page = self.lxmlize(COUNCIL_PAGE)
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://www.belleville.ca/city-hall/page/city-council
|
C
|
ca_on_brampton
|
2024-04-23 04:27:54
|
2024-04-23 04:27:54
|
|
C
|
ca_on_brantford
|
2024-04-23 04:43:34
|
2024-04-23 04:43:34
|
|
D>
04:16:04 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:3524002/legislature yet
|
ca_on_burlington
|
|
2024-04-23 04:16:04
|
scrapelib.HTTPError: 404 while retrieving https://opendata.arcgis.com/datasets/f2c404c667904f03be38443cbd474cd3_0.csv
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/utils.py", line 379, in scrape
reader = self.csv_reader(
File "/app/scrapers/utils.py", line 227, in csv_reader
response = self.get(url, **kwargs)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://opendata.arcgis.com/datasets/f2c404c667904f03be38443cbd474cd3_0.csv
|
D>
04:15:43 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:3521024/legislature yet
|
ca_on_caledon
|
|
2024-04-23 04:15:43
|
IndexError: list index out of range
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_on_caledon/people.py", line 11, in scrape
node = page.xpath('//td[@rowspan="2"]')[0]
IndexError: list index out of range
|
C
|
ca_on_cambridge
|
2024-04-23 04:28:08
|
2024-04-23 04:28:08
|
|
D>
04:26:59 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:3536020/legislature yet
|
ca_on_chatham_kent
|
|
2024-04-23 04:26:59
|
scrapelib.HTTPError: 404 while retrieving https://www.chatham-kent.ca/local-government/council/council-members
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_on_chatham_kent/people.py", line 16, in scrape
page = self.lxmlize(COUNCIL_PAGE)
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://www.chatham-kent.ca/local-government/council/council-members
|
C
|
ca_on_fort_erie
|
2024-04-23 04:16:14
|
2024-04-23 04:16:14
|
|
C
|
ca_on_georgina
|
2024-04-23 04:19:49
|
2024-04-23 04:19:49
|
|
C
|
ca_on_greater_sudbury
|
2024-04-23 04:28:13
|
2024-04-23 04:28:13
|
|
D>
|
ca_on_grimsby
|
2024-01-12 04:22:13
|
2024-04-23 04:01:42
|
scrapelib.HTTPError: 404 while retrieving https://niagaraopendata.ca/dataset/fe096749-6ca8-4ae7-b80e-dc682a698759/resource/8…
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/utils.py", line 379, in scrape
reader = self.csv_reader(
File "/app/scrapers/utils.py", line 227, in csv_reader
response = self.get(url, **kwargs)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://niagaraopendata.ca/dataset/fe096749-6ca8-4ae7-b80e-dc682a698759/resource/892a4873-cbe7-4c32-9b70-9f364467955e/download/grimsbycouncil20160210.csv
|
C
|
ca_on_guelph
|
2024-04-23 04:28:14
|
2024-04-23 04:28:14
|
|
D>
04:16:10 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:3528018/legislature yet
|
ca_on_haldimand_county
|
|
2024-04-23 04:16:10
|
AssertionError: No councillors found
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_on_haldimand_county/people.py", line 14, in scrape
assert len(councillors), "No councillors found"
AssertionError: No councillors found
|
D>
04:15:44 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:3525005/legislature yet
|
ca_on_hamilton
|
|
2024-04-23 04:15:44
|
scrapelib.HTTPError: 404 while retrieving https://www.hamilton.ca/council-committee/mayor-council/city-councillors
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_on_hamilton/people.py", line 9, in scrape
page = self.lxmlize(COUNCIL_PAGE)
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://www.hamilton.ca/council-committee/mayor-council/city-councillors
|
D>
04:43:32 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/cd:3540/legislature yet
|
ca_on_huron
|
|
2024-04-23 04:43:32
|
pupa.exceptions.UnresolvedIdError: cannot resolve pseudo id to Post: ~{"label": "Huron (seat 1)", "organization__classificat…
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 307, in do_handle
report['import'] = self.do_import(juris, args)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 211, in do_import
report.update(membership_importer.import_directory(datadir))
File "/app/.heroku/src/pupa/pupa/importers/base.py", line 190, in import_directory
return self.import_data(json_stream())
File "/app/.heroku/src/pupa/pupa/importers/base.py", line 227, in import_data
obj_id, what = self.import_item(data)
File "/app/.heroku/src/pupa/pupa/importers/base.py", line 247, in import_item
data = self.prepare_for_db(data)
File "/app/.heroku/src/pupa/pupa/importers/memberships.py", line 50, in prepare_for_db
data['post_id'] = self.post_importer.resolve_json_id(data['post_id'])
File "/app/.heroku/src/pupa/pupa/importers/base.py", line 165, in resolve_json_id
raise UnresolvedIdError(errmsg)
pupa.exceptions.UnresolvedIdError: cannot resolve pseudo id to Post: ~{"label": "Huron (seat 1)", "organization__classification": "legislature", "role": "Councillor"}
|
C
|
ca_on_king
|
2024-04-23 04:16:23
|
2024-04-23 04:16:23
|
|
C
|
ca_on_kingston
|
2024-04-23 04:00:35
|
2024-04-23 04:00:35
|
|
C
|
ca_on_kitchener
|
2024-04-23 04:02:57
|
2024-04-23 04:02:57
|
|
D>
04:19:50 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/cd:3538/legislature yet
|
ca_on_lambton
|
|
2024-04-23 04:19:50
|
AssertionError: No councillors found
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_on_lambton/people.py", line 15, in scrape
assert len(councillors), "No councillors found"
AssertionError: No councillors found
|
C
|
ca_on_lincoln
|
2024-04-23 04:16:13
|
2024-04-23 04:16:13
|
|
D>
04:16:00 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:3539036/legislature yet
|
ca_on_london
|
|
2024-04-23 04:16:00
|
scrapelib.HTTPError: 404 while retrieving https://apps.london.ca/OpenData/CSV/Council.csv
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/utils.py", line 379, in scrape
reader = self.csv_reader(
File "/app/scrapers/utils.py", line 227, in csv_reader
response = self.get(url, **kwargs)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://apps.london.ca/OpenData/CSV/Council.csv
|
D>
04:19:41 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:3519036/legislature yet
|
ca_on_markham
|
|
2024-04-23 04:19:41
|
IndexError: list index out of range
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_on_markham/people.py", line 13, in scrape
mayor_url = page.xpath('//a[contains(text(), "Office of the Mayor")]/@href')[0]
IndexError: list index out of range
|
D>
04:06:57 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:3524009/legislature yet
|
ca_on_milton
|
|
2024-04-23 04:06:57
|
AssertionError: No councillors found
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_on_milton/people.py", line 14, in scrape
assert len(councillors), "No councillors found"
AssertionError: No councillors found
|
D>
|
ca_on_mississauga
|
2024-03-19 04:07:47
|
2024-04-23 04:06:56
|
IndexError: list index out of range
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_on_mississauga/people.py", line 17, in scrape
yield self.councillor_data(councillor_url.attrib["href"])
File "/app/scrapers/ca_on_mississauga/people.py", line 35, in councillor_data
photo = page.xpath(
IndexError: list index out of range
|
C
|
ca_on_newmarket
|
2024-04-23 04:03:09
|
2024-04-23 04:03:09
|
|
C
|
ca_on_niagara
|
2024-04-23 04:15:52
|
2024-04-23 04:15:52
|
|
C
|
ca_on_niagara_on_the_lake
|
2024-04-23 04:02:55
|
2024-04-23 04:02:55
|
|
C
|
ca_on_north_dumfries
|
2024-04-23 04:28:11
|
2024-04-23 04:28:11
|
|
D>
04:19:59 WARNING pupa: validation of CanadianPerson bf54b440-0128-11ef-9f20-6a82ce95162d failed: 1 validation errors:
Value 'Sean Oâ\x80\x99Meara' for field '<obj>.name' does not match regular expression 'regex.Regex('\\A(?!(?:Chair|Commissioner|Conseiller|Councillor|Deputy|Dr|Hon|M|Maire|Mayor|Miss|Mme|Mr|Mrs|Ms|Regional|Warden)\\b)(?:(?:(?:\\p{Lu}\\.)+|\\p{Lu}+|(?:Jr|Rev|Sr|St)\\.|da|de|den|der|la|van|von|[("](?:\\p{Lu}+|\\p{Lu}\\p{Ll}*(?:-\\p{Lu}\\p{Ll}*)*)[)"]|(?:D\'|d\'|De|de|Des|Di|Du|L\'|La|Le|Mac|Mc|O\'|San|Van|Vander?|vanden)?\\p{Lu}\\p{Ll}+|\\p{Lu}\\p{Ll}+Anne?|Marie\\p{Lu}\\p{Ll}+|Ch\'ng|Prud\'homme|D!ONNE|IsaBelle|Ya\'ara)(?:\'|-| - | ))+(?:(?:\\p{Lu}\\.)+|\\p{Lu}+|(?:Jr|Rev|Sr|St)\\.|da|de|den|der|la|van|von|[("](?:\\p{Lu}+|\\p{Lu}\\p{Ll}*(?:-\\p{Lu}\\p{Ll}*)*)[)"]|(?:D\'|d\'|De|de|Des|Di|Du|L\'|La|Le|Mac|Mc|O\'|San|Van|Vander?|vanden)?\\p{Lu}\\p{Ll}+|\\p{Lu}\\p{Ll}+Anne?|Marie\\p{Lu}\\p{Ll}+|Ch\'ng|Prud\'homme|D!ONNE|IsaBelle|Ya\'ara)\\Z', flags=regex.V0)'
04:19:59 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:3524001/legislature yet
|
ca_on_oakville
|
|
2024-04-23 04:19:59
|
Value 'Sean Oâ\x80\x99Meara' for field '<obj>.name' does not match regular expression 'regex.Regex('\\A(?!(?:Chair|Commissio…
Traceback (most recent call last):
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 175, in validate
validator.validate(self.as_dict(), schema)
File "/app/.heroku/python/lib/python3.8/site-packages/validictory/validator.py", line 620, in validate
raise MultipleValidationError(self._errors)
validictory.validator.MultipleValidationError: 1 validation errors:
Value 'Sean Oâ\x80\x99Meara' for field '<obj>.name' does not match regular expression 'regex.Regex('\\A(?!(?:Chair|Commissioner|Conseiller|Councillor|Deputy|Dr|Hon|M|Maire|Mayor|Miss|Mme|Mr|Mrs|Ms|Regional|Warden)\\b)(?:(?:(?:\\p{Lu}\\.)+|\\p{Lu}+|(?:Jr|Rev|Sr|St)\\.|da|de|den|der|la|van|von|[("](?:\\p{Lu}+|\\p{Lu}\\p{Ll}*(?:-\\p{Lu}\\p{Ll}*)*)[)"]|(?:D\'|d\'|De|de|Des|Di|Du|L\'|La|Le|Mac|Mc|O\'|San|Van|Vander?|vanden)?\\p{Lu}\\p{Ll}+|\\p{Lu}\\p{Ll}+Anne?|Marie\\p{Lu}\\p{Ll}+|Ch\'ng|Prud\'homme|D!ONNE|IsaBelle|Ya\'ara)(?:\'|-| - | ))+(?:(?:\\p{Lu}\\.)+|\\p{Lu}+|(?:Jr|Rev|Sr|St)\\.|da|de|den|der|la|van|von|[("](?:\\p{Lu}+|\\p{Lu}\\p{Ll}*(?:-\\p{Lu}\\p{Ll}*)*)[)"]|(?:D\'|d\'|De|de|Des|Di|Du|L\'|La|Le|Mac|Mc|O\'|San|Van|Vander?|vanden)?\\p{Lu}\\p{Ll}+|\\p{Lu}\\p{Ll}+Anne?|Marie\\p{Lu}\\p{Ll}+|Ch\'ng|Prud\'homme|D!ONNE|IsaBelle|Ya\'ara)\\Z', flags=regex.V0)'
During handling of the above exception, another exception occurred:
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 104, in do_scrape
self.save_object(obj)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 89, in save_object
raise ve
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 85, in save_object
obj.validate()
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 177, in validate
raise ScrapeValueError('validation of {} {} failed: {}'.format(
pupa.exceptions.ScrapeValueError: validation of CanadianPerson bf54b440-0128-11ef-9f20-6a82ce95162d failed: 1 validation errors:
Value 'Sean Oâ\x80\x99Meara' for field '<obj>.name' does not match regular expression 'regex.Regex('\\A(?!(?:Chair|Commissioner|Conseiller|Councillor|Deputy|Dr|Hon|M|Maire|Mayor|Miss|Mme|Mr|Mrs|Ms|Regional|Warden)\\b)(?:(?:(?:\\p{Lu}\\.)+|\\p{Lu}+|(?:Jr|Rev|Sr|St)\\.|da|de|den|der|la|van|von|[("](?:\\p{Lu}+|\\p{Lu}\\p{Ll}*(?:-\\p{Lu}\\p{Ll}*)*)[)"]|(?:D\'|d\'|De|de|Des|Di|Du|L\'|La|Le|Mac|Mc|O\'|San|Van|Vander?|vanden)?\\p{Lu}\\p{Ll}+|\\p{Lu}\\p{Ll}+Anne?|Marie\\p{Lu}\\p{Ll}+|Ch\'ng|Prud\'homme|D!ONNE|IsaBelle|Ya\'ara)(?:\'|-| - | ))+(?:(?:\\p{Lu}\\.)+|\\p{Lu}+|(?:Jr|Rev|Sr|St)\\.|da|de|den|der|la|van|von|[("](?:\\p{Lu}+|\\p{Lu}\\p{Ll}*(?:-\\p{Lu}\\p{Ll}*)*)[)"]|(?:D\'|d\'|De|de|Des|Di|Du|L\'|La|Le|Mac|Mc|O\'|San|Van|Vander?|vanden)?\\p{Lu}\\p{Ll}+|\\p{Lu}\\p{Ll}+Anne?|Marie\\p{Lu}\\p{Ll}+|Ch\'ng|Prud\'homme|D!ONNE|IsaBelle|Ya\'ara)\\Z', flags=regex.V0)'
|
D>
04:03:11 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:3518013/legislature yet
|
ca_on_oshawa
|
|
2024-04-23 04:03:11
|
scrapelib.HTTPError: 404 while retrieving https://www.oshawa.ca/city-hall/city-council-members.asp
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_on_oshawa/people.py", line 9, in scrape
page = self.lxmlize(COUNCIL_PAGE)
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://www.oshawa.ca/city-hall/city-council-members.asp
|
D>
04:42:14 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:3506008/legislature yet
|
ca_on_ottawa
|
|
2024-04-23 04:42:14
|
KeyError: 'name'
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/utils.py", line 394, in scrape
if not self.is_valid_row(row):
File "/app/scrapers/utils.py", line 348, in is_valid_row
return row["name"] not in empty
KeyError: 'name'
|
D>
04:41:02 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/cd:3521/legislature yet
|
ca_on_peel
|
|
2024-04-23 04:41:02
|
scrapelib.HTTPError: 404 while retrieving https://data.peelregion.ca/media/43505/wards1822_csv.csv
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/utils.py", line 379, in scrape
reader = self.csv_reader(
File "/app/scrapers/utils.py", line 227, in csv_reader
response = self.get(url, **kwargs)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://data.peelregion.ca/media/43505/wards1822_csv.csv
|
D>
04:41:00 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:3518001/legislature yet
|
ca_on_pickering
|
|
2024-04-23 04:41:00
|
AssertionError: No councillors found
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_on_pickering/people.py", line 17, in scrape
assert len(councillors), "No councillors found"
AssertionError: No councillors found
|
C
|
ca_on_richmond_hill
|
2024-04-23 04:03:08
|
2024-04-23 04:03:08
|
|
D>
04:20:22 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/province:on/school yet
|
ca_on_school_boards_english_public
|
|
2024-04-23 04:20:22
|
KeyError: 'district name'
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/utils.py", line 400, in scrape
elif row[key] in corrections:
KeyError: 'district name'
|
C
|
ca_on_st_catharines
|
2024-04-23 04:15:56
|
2024-04-23 04:15:56
|
|
D>
04:41:01 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:3558004/legislature yet
|
ca_on_thunder_bay
|
|
2024-04-23 04:41:01
|
requests.exceptions.SSLError: HTTPSConnectionPool(host='www.thunderbay.ca', port=443): Max retries exceeded with url: /en/ci…
Traceback (most recent call last):
File "/app/.heroku/python/lib/python3.8/site-packages/urllib3/connectionpool.py", line 715, in urlopen
httplib_response = self._make_request(
File "/app/.heroku/python/lib/python3.8/site-packages/urllib3/connectionpool.py", line 404, in _make_request
self._validate_conn(conn)
File "/app/.heroku/python/lib/python3.8/site-packages/urllib3/connectionpool.py", line 1058, in _validate_conn
conn.connect()
File "/app/.heroku/python/lib/python3.8/site-packages/urllib3/connection.py", line 419, in connect
self.sock = ssl_wrap_socket(
File "/app/.heroku/python/lib/python3.8/site-packages/urllib3/util/ssl_.py", line 449, in ssl_wrap_socket
ssl_sock = _ssl_wrap_socket_impl(
File "/app/.heroku/python/lib/python3.8/site-packages/urllib3/util/ssl_.py", line 493, in _ssl_wrap_socket_impl
return ssl_context.wrap_socket(sock, server_hostname=server_hostname)
File "/app/.heroku/python/lib/python3.8/ssl.py", line 500, in wrap_socket
return self.sslsocket_class._create(
File "/app/.heroku/python/lib/python3.8/ssl.py", line 1073, in _create
self.do_handshake()
File "/app/.heroku/python/lib/python3.8/ssl.py", line 1342, in do_handshake
self._sslobj.do_handshake()
ssl.SSLError: [SSL: DH_KEY_TOO_SMALL] dh key too small (_ssl.c:1131)
During handling of the above exception, another exception occurred:
Traceback (most recent call last):
File "/app/.heroku/python/lib/python3.8/site-packages/requests/adapters.py", line 486, in send
resp = conn.urlopen(
File "/app/.heroku/python/lib/python3.8/site-packages/urllib3/connectionpool.py", line 799, in urlopen
retries = retries.increment(
File "/app/.heroku/python/lib/python3.8/site-packages/urllib3/util/retry.py", line 592, in increment
raise MaxRetryError(_pool, url, error or ResponseError(cause))
urllib3.exceptions.MaxRetryError: HTTPSConnectionPool(host='www.thunderbay.ca', port=443): Max retries exceeded with url: /en/city-hall/mayor-and-council.aspx (Caused by SSLError(SSLError(1, '[SSL: DH_KEY_TOO_SMALL] dh key too small (_ssl.c:1131)')))
During handling of the above exception, another exception occurred:
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_on_thunder_bay/people.py", line 10, in scrape
page = self.lxmlize(COUNCIL_PAGE)
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 579, in request
resp = super().request(
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 404, in request
resp = super().request(
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 232, in request
return super().request(
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 122, in request
resp = super().request(
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 589, in request
resp = self.send(prep, **send_kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 703, in send
r = adapter.send(request, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/adapters.py", line 517, in send
raise SSLError(e, request=request)
requests.exceptions.SSLError: HTTPSConnectionPool(host='www.thunderbay.ca', port=443): Max retries exceeded with url: /en/city-hall/mayor-and-council.aspx (Caused by SSLError(SSLError(1, '[SSL: DH_KEY_TOO_SMALL] dh key too small (_ssl.c:1131)')))
|
C
|
ca_on_toronto
|
2024-04-23 04:00:29
|
2024-04-23 04:00:30
|
|
C
|
ca_on_uxbridge
|
2024-04-23 04:19:43
|
2024-04-23 04:19:43
|
|
D>
04:19:57 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:3519028/legislature yet
|
ca_on_vaughan
|
|
2024-04-23 04:19:57
|
AssertionError: No councillors found
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_on_vaughan/people.py", line 16, in scrape
assert len(councillors), "No councillors found"
AssertionError: No councillors found
|
C
|
ca_on_waterloo
|
2024-04-23 04:00:37
|
2024-04-23 04:00:37
|
|
D>
14:59:42 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/cd:3530/legislature yet
|
ca_on_waterloo_region
|
|
2024-04-23 14:59:42
|
KeyError: 'district name'
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/utils.py", line 399, in scrape
row[key] = corrections(row[key])
KeyError: 'district name'
|
D>
04:43:33 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:3526032/legislature yet
|
ca_on_welland
|
|
2024-04-23 04:43:33
|
scrapelib.HTTPError: 404 while retrieving https://niagaraopendata.ca/dataset/b38e2f85-bcd4-43fd-95d5-f513919514d9/resource/5…
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/utils.py", line 379, in scrape
reader = self.csv_reader(
File "/app/scrapers/utils.py", line 227, in csv_reader
response = self.get(url, **kwargs)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://niagaraopendata.ca/dataset/b38e2f85-bcd4-43fd-95d5-f513919514d9/resource/590c9110-01f3-4256-8ac1-9c5cbeca88c5/download/city-of-welland-mayor-and-council-members.csv
|
D>
|
ca_on_wellesley
|
2024-03-19 04:38:26
|
2024-04-23 04:26:58
|
AssertionError
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_on_wellesley/people.py", line 21, in scrape
assert len(members) == 5
AssertionError
|
D>
04:25:26 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:3518009/legislature yet
|
ca_on_whitby
|
|
2024-04-23 04:25:26
|
scrapelib.HTTPError: 404 while retrieving https://www.whitby.ca/Common/PageNotFound.aspx?aspxerrorpath=/en/town-hall/council…
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_on_whitby/people.py", line 10, in scrape
page = self.lxmlize(COUNCIL_PAGE)
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://www.whitby.ca/Common/PageNotFound.aspx?aspxerrorpath=/en/town-hall/council-members.aspx
|
C
|
ca_on_whitchurch_stouffville
|
2024-04-23 04:44:54
|
2024-04-23 04:44:54
|
|
D>
|
ca_on_windsor
|
2023-06-05 04:00:27
|
2024-04-23 04:20:24
|
scrapelib.HTTPError: 404 while retrieving https://www.citywindsor.ca/opendata/Lists/OpenData/Attachments/33/City%20Windsor%2…
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/utils.py", line 379, in scrape
reader = self.csv_reader(
File "/app/scrapers/utils.py", line 227, in csv_reader
response = self.get(url, **kwargs)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://www.citywindsor.ca/opendata/Lists/OpenData/Attachments/33/City%20Windsor%20Elected%20Officials.csv
|
C
|
ca_pe
|
2024-04-23 04:27:53
|
2024-04-23 04:27:53
|
|
D>
04:42:18 WARNING scrapelib: sleeping for 10 seconds before retry
04:42:28 WARNING scrapelib: sleeping for 20 seconds before retry
04:42:48 WARNING scrapelib: sleeping for 40 seconds before retry
04:43:28 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:1102075/legislature yet
|
ca_pe_charlottetown
|
|
2024-04-23 04:43:28
|
scrapelib.HTTPError: 403 while retrieving https://www.charlottetown.ca/mayor___council/city_council/meet_my_councillor
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_pe_charlottetown/people.py", line 11, in scrape
page = self.lxmlize(COUNCIL_PAGE)
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 403 while retrieving https://www.charlottetown.ca/mayor___council/city_council/meet_my_councillor
|
C
|
ca_qc
|
2024-04-23 04:13:19
|
2024-04-23 04:13:19
|
|
D>
|
ca_qc_beaconsfield
|
2024-03-27 04:04:06
|
2024-04-23 04:16:02
|
AssertionError: No councillors found
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_qc_beaconsfield/people.py", line 12, in scrape
assert len(councillors), "No councillors found"
AssertionError: No councillors found
|
D>
04:03:16 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:2458007/legislature yet
|
ca_qc_brossard
|
|
2024-04-23 04:03:16
|
AssertionError: No councillors found
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_qc_brossard/people.py", line 18, in scrape
assert len(councillors), "No councillors found"
AssertionError: No councillors found
|
D>
04:16:06 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:2466058/legislature yet
|
ca_qc_cote_saint_luc
|
|
2024-04-23 04:16:06
|
AssertionError: No councillors found
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_qc_cote_saint_luc/people.py", line 13, in scrape
assert len(councillors), "No councillors found"
AssertionError: No councillors found
|
D>
04:03:27 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:2466142/legislature yet
|
ca_qc_dollard_des_ormeaux
|
|
2024-04-23 04:03:27
|
scrapelib.HTTPError: 404 while retrieving https://ville.ddo.qc.ca/en/my-municipality/members-council
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_qc_dollard_des_ormeaux/people.py", line 9, in scrape
page = self.lxmlize(COUNCIL_PAGE)
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://ville.ddo.qc.ca/en/my-municipality/members-council
|
C
|
ca_qc_dorval
|
2024-04-23 04:27:58
|
2024-04-23 04:27:58
|
|
D>
04:03:24 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:2481017/legislature yet
|
ca_qc_gatineau
|
|
2024-04-23 04:03:24
|
IndexError: list index out of range
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_qc_gatineau/people.py", line 20, in scrape
p = Person(primary_org="legislature", name=names[0], district="Gatineau", role="Maire")
IndexError: list index out of range
|
D>
04:41:03 WARNING scrapelib: sleeping for 10 seconds before retry
04:41:13 WARNING scrapelib: sleeping for 20 seconds before retry
04:41:33 WARNING scrapelib: sleeping for 40 seconds before retry
04:42:13 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:2466102/legislature yet
|
ca_qc_kirkland
|
|
2024-04-23 04:42:13
|
scrapelib.HTTPError: 403 while retrieving https://www.ville.kirkland.qc.ca/portrait-municipal/conseil-municipal/elus-municip…
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_qc_kirkland/people.py", line 11, in scrape
page = self.lxmlize(COUNCIL_PAGE, "iso-8859-1")
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 403 while retrieving https://www.ville.kirkland.qc.ca/portrait-municipal/conseil-municipal/elus-municipaux
|
C
|
ca_qc_laval
|
2024-04-23 18:57:07
|
2024-04-23 18:57:07
|
|
D>
04:28:15 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:2425213/legislature yet
|
ca_qc_levis
|
|
2024-04-23 04:28:15
|
IndexError: list index out of range
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_qc_levis/people.py", line 15, in scrape
position, name = person.xpath("./h2/text()")[0].replace("–", "-").split(" - ")
IndexError: list index out of range
|
D>
04:28:07 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:2458227/legislature yet
|
ca_qc_longueuil
|
|
2024-04-23 04:28:07
|
scrapelib.HTTPError: 404 while retrieving https://www.longueuil.quebec/fr/conseil-ville
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_qc_longueuil/people.py", line 10, in scrape
page = self.lxmlize(COUNCIL_PAGE, "utf-8")
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://www.longueuil.quebec/fr/conseil-ville
|
D>
04:23:21 WARNING scrapelib: got Exceeded 30 redirects. sleeping for 10 seconds before retry
04:23:49 WARNING scrapelib: got Exceeded 30 redirects. sleeping for 20 seconds before retry
04:24:27 WARNING scrapelib: got Exceeded 30 redirects. sleeping for 40 seconds before retry
04:25:24 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:2467045/legislature yet
|
ca_qc_mercier
|
|
2024-04-23 04:25:24
|
requests.exceptions.TooManyRedirects: Exceeded 30 redirects.
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_qc_mercier/people.py", line 12, in scrape
page = self.lxmlize(COUNCIL_PAGE, user_agent=CUSTOM_USER_AGENT, encoding="windows-1252")
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 579, in request
resp = super().request(
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 404, in request
resp = super().request(
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 232, in request
return super().request(
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 175, in request
raise exception_raised
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 122, in request
resp = super().request(
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 589, in request
resp = self.send(prep, **send_kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 725, in send
history = [resp for resp in gen]
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 725, in <listcomp>
history = [resp for resp in gen]
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 191, in resolve_redirects
raise TooManyRedirects(
requests.exceptions.TooManyRedirects: Exceeded 30 redirects.
|
D>
04:03:18 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:2466023/legislature yet
|
ca_qc_montreal
|
|
2024-04-23 04:03:18
|
scrapelib.HTTPError: 404 while retrieving https://donnees.montreal.ca/dataset/381d74ca-dadd-459f-95c9-db255b5f4480/resource/…
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/utils.py", line 379, in scrape
reader = self.csv_reader(
File "/app/scrapers/utils.py", line 227, in csv_reader
response = self.get(url, **kwargs)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://donnees.montreal.ca/dataset/381d74ca-dadd-459f-95c9-db255b5f4480/resource/ce1315a3-50ee-48d0-a0f0-9bcc15f65643/download/listeelusmontreal.csv
|
D>
04:42:17 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:2466007/legislature yet
|
ca_qc_montreal_est
|
|
2024-04-23 04:42:17
|
scrapelib.HTTPError: 404 while retrieving https://ville.montreal-est.qc.ca/histoire-et-patrimoine/histoire-de-montreal-est/c…
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_qc_montreal_est/people.py", line 10, in scrape
page = self.lxmlize(COUNCIL_PAGE)
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://ville.montreal-est.qc.ca/histoire-et-patrimoine/histoire-de-montreal-est/conseil-municipal/conseils-municipaux/
|
D>
04:03:21 WARNING pupa: validation of CanadianPerson 6c6e931a-0126-11ef-9f20-6a82ce95162d failed: 1 validation errors:
Value 'data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAZAAAAGQAQAAAACoxAthAAAAAnRSTlMAAHaTzTgAAAAqSURBVHja7cExAQAAAMKg9U/tbwagAAAAAAAAAAAAAAAAAAAAAAAAAIA3T7AAAZRBGFwAAAAASUVORK5CYII=' for field '<obj>.image' does not match regular expression '\A(?:(?:ftp|https?)://|\Z)'
|
ca_qc_pointe_claire
|
2024-03-12 04:56:49
|
2024-04-23 04:03:21
|
Value 'data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAZAAAAGQAQAAAACoxAthAAAAAnRSTlMAAHaTzTgAAAAqSURBVHja7cExAQAAAMKg9U/tbwa…
Traceback (most recent call last):
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 175, in validate
validator.validate(self.as_dict(), schema)
File "/app/.heroku/python/lib/python3.8/site-packages/validictory/validator.py", line 620, in validate
raise MultipleValidationError(self._errors)
validictory.validator.MultipleValidationError: 1 validation errors:
Value 'data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAZAAAAGQAQAAAACoxAthAAAAAnRSTlMAAHaTzTgAAAAqSURBVHja7cExAQAAAMKg9U/tbwagAAAAAAAAAAAAAAAAAAAAAAAAAIA3T7AAAZRBGFwAAAAASUVORK5CYII=' for field '<obj>.image' does not match regular expression '\A(?:(?:ftp|https?)://|\Z)'
During handling of the above exception, another exception occurred:
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 104, in do_scrape
self.save_object(obj)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 89, in save_object
raise ve
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 85, in save_object
obj.validate()
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 177, in validate
raise ScrapeValueError('validation of {} {} failed: {}'.format(
pupa.exceptions.ScrapeValueError: validation of CanadianPerson 6c6e931a-0126-11ef-9f20-6a82ce95162d failed: 1 validation errors:
Value 'data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAZAAAAGQAQAAAACoxAthAAAAAnRSTlMAAHaTzTgAAAAqSURBVHja7cExAQAAAMKg9U/tbwagAAAAAAAAAAAAAAAAAAAAAAAAAIA3T7AAAZRBGFwAAAAASUVORK5CYII=' for field '<obj>.image' does not match regular expression '\A(?:(?:ftp|https?)://|\Z)'
|
D>
04:03:13 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:2423027/legislature yet
|
ca_qc_quebec
|
|
2024-04-23 04:03:13
|
pupa.exceptions.UnresolvedIdError: cannot resolve pseudo id to Post: ~{"label": "Saules\u2014Les M\u00e9andres", "organizati…
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 307, in do_handle
report['import'] = self.do_import(juris, args)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 211, in do_import
report.update(membership_importer.import_directory(datadir))
File "/app/.heroku/src/pupa/pupa/importers/base.py", line 190, in import_directory
return self.import_data(json_stream())
File "/app/.heroku/src/pupa/pupa/importers/base.py", line 227, in import_data
obj_id, what = self.import_item(data)
File "/app/.heroku/src/pupa/pupa/importers/base.py", line 247, in import_item
data = self.prepare_for_db(data)
File "/app/.heroku/src/pupa/pupa/importers/memberships.py", line 50, in prepare_for_db
data['post_id'] = self.post_importer.resolve_json_id(data['post_id'])
File "/app/.heroku/src/pupa/pupa/importers/base.py", line 165, in resolve_json_id
raise UnresolvedIdError(errmsg)
pupa.exceptions.UnresolvedIdError: cannot resolve pseudo id to Post: ~{"label": "Saules\u2014Les M\u00e9andres", "organization__classification": "legislature", "role": "Conseiller"}
|
D>
04:00:27 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:2494068/legislature yet
|
ca_qc_saguenay
|
|
2024-04-23 04:00:27
|
IndexError: list index out of range
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_qc_saguenay/people.py", line 14, in scrape
name = mayor_page.xpath('//span/text()[contains(., "maire")]')[0].split(", ", 1)[0]
IndexError: list index out of range
|
D>
04:21:38 WARNING scrapelib: sleeping for 10 seconds before retry
04:21:49 WARNING scrapelib: sleeping for 20 seconds before retry
04:22:09 WARNING scrapelib: sleeping for 40 seconds before retry
|
ca_qc_sainte_anne_de_bellevue
|
2023-10-24 04:04:32
|
2024-04-23 04:22:49
|
scrapelib.HTTPError: 403 while retrieving https://ville.sainte-anne-de-bellevue.qc.ca/fr/199/elus-municipaux
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_qc_sainte_anne_de_bellevue/people.py", line 11, in scrape
page = self.lxmlize(COUNCIL_PAGE)
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 403 while retrieving https://ville.sainte-anne-de-bellevue.qc.ca/fr/199/elus-municipaux
|
C
|
ca_qc_saint_jean_sur_richelieu
|
2024-04-23 04:20:18
|
2024-04-23 04:20:18
|
|
D>
04:27:59 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:2475017/legislature yet
|
ca_qc_saint_jerome
|
|
2024-04-23 04:27:59
|
Exception: No email node in b'<div class=" inner_member">\n <div class="portrait_single">\n <img width="819" hei…
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_qc_saint_jerome/people.py", line 31, in scrape
p.add_contact("email", self.get_email(councillor))
File "/app/scrapers/utils.py", line 141, in get_email
raise Exception("No email node in {}".format(etree.tostring(node)))
Exception: No email node in b'<div class=" inner_member">\n <div class="portrait_single">\n <img width="819" height="1024" src="data:image/svg+xml,%3Csvg%20xmlns=\'http://www.w3.org/2000/svg\'%20viewBox=\'0%200%20819%201024\'%3E%3C/svg%3E" class="single_pic wp-post-image" alt="Marc Bourcier" decoding="async" fetchpriority="high" data-lazy-srcset="https://www.vsj.ca/wp-content/uploads/2019/11/0_Marc_Bourcier-819x1024.jpg 819w, https://www.vsj.ca/wp-content/uploads/2019/11/0_Marc_Bourcier-240x300.jpg 240w, https://www.vsj.ca/wp-content/uploads/2019/11/0_Marc_Bourcier-768x960.jpg 768w, https://www.vsj.ca/wp-content/uploads/2019/11/0_Marc_Bourcier-1229x1536.jpg 1229w, https://www.vsj.ca/wp-content/uploads/2019/11/0_Marc_Bourcier-500x625.jpg 500w, https://www.vsj.ca/wp-content/uploads/2019/11/0_Marc_Bourcier-800x1000.jpg 800w, https://www.vsj.ca/wp-content/uploads/2019/11/0_Marc_Bourcier-1280x1600.jpg 1280w, https://www.vsj.ca/wp-content/uploads/2019/11/0_Marc_Bourcier.jpg 1536w" data-lazy-sizes="(max-width: 819px) 100vw, 819px" data-lazy-src="https://www.vsj.ca/wp-content/uploads/2019/11/0_Marc_Bourcier-819x1024.jpg"/><noscript><img width="819" height="1024" src="https://www.vsj.ca/wp-content/uploads/2019/11/0_Marc_Bourcier-819x1024.jpg" class="single_pic wp-post-image" alt="Marc Bourcier" decoding="async" fetchpriority="high" srcset="https://www.vsj.ca/wp-content/uploads/2019/11/0_Marc_Bourcier-819x1024.jpg 819w, https://www.vsj.ca/wp-content/uploads/2019/11/0_Marc_Bourcier-240x300.jpg 240w, https://www.vsj.ca/wp-content/uploads/2019/11/0_Marc_Bourcier-768x960.jpg 768w, https://www.vsj.ca/wp-content/uploads/2019/11/0_Marc_Bourcier-1229x1536.jpg 1229w, https://www.vsj.ca/wp-content/uploads/2019/11/0_Marc_Bourcier-500x625.jpg 500w, https://www.vsj.ca/wp-content/uploads/2019/11/0_Marc_Bourcier-800x1000.jpg 800w, https://www.vsj.ca/wp-content/uploads/2019/11/0_Marc_Bourcier-1280x1600.jpg 1280w, https://www.vsj.ca/wp-content/uploads/2019/11/0_Marc_Bourcier.jpg 1536w" sizes="(max-width: 819px) 100vw, 819px"/></noscript> </div>\n <div class="info_member">\n <div class="district">\n Maire </div>\n <h2 class="entry-title">Marc Bourcier</h2>\n <div class="phone">\n 450 436-1512, poste 3021 </div>\n \n <div class="wp-block-list mail">\n <a class="space-a" href="https://www.vsj.ca/cdn-cgi/l/email-protection#3d505c544f54587d4b4e57135e5c"><span class="__cf_email__" data-cfemail="5e333f372c373b1e282d34703d3f">[email protected]</span></a>\n </div>\n <div class="wp-block-list wysiwyg">\n<ul><li>Président du comité exécutif</li><li>Membre d’office de tous les comités ainsi que toutes les commissions du conseil</li><li>Administrateur de la Municipalité régionale de comté de la Rivière-du-Nord (MRC)</li><li>Vice-Président de la Régie intermunicipale de l’Aréna régional de la Rivière-du-Nord</li></ul>\n</div> </div>\n </div> \n '
|
D>
|
ca_qc_senneville
|
2022-09-06 04:41:24
|
2024-04-23 04:28:02
|
scrapelib.HTTPError: 404 while retrieving https://www.senneville.ca/fr/7/conseil-municipal
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_qc_senneville/people.py", line 9, in scrape
page = self.lxmlize(COUNCIL_PAGE)
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 404 while retrieving https://www.senneville.ca/fr/7/conseil-municipal
|
D>
04:43:30 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:2443027/legislature yet
|
ca_qc_sherbrooke
|
|
2024-04-23 04:43:30
|
AssertionError: No councillors found
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_qc_sherbrooke/people.py", line 12, in scrape
assert len(councillors), "No councillors found"
AssertionError: No councillors found
|
D>
04:43:35 WARNING scrapelib: sleeping for 10 seconds before retry
04:43:45 WARNING scrapelib: sleeping for 20 seconds before retry
04:44:06 WARNING scrapelib: sleeping for 40 seconds before retry
04:44:46 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:2464008/legislature yet
|
ca_qc_terrebonne
|
|
2024-04-23 04:44:46
|
scrapelib.HTTPError: 500 while retrieving https://terrebonne.ca/fr/10/Conseil_municipal
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_qc_terrebonne/people.py", line 9, in scrape
page = self.lxmlize(COUNCIL_PAGE, "utf-8")
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 602, in request
raise HTTPError(resp)
scrapelib.HTTPError: 500 while retrieving https://terrebonne.ca/fr/10/Conseil_municipal
|
D>
04:19:45 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:2437067/legislature yet
|
ca_qc_trois_rivieres
|
|
2024-04-23 04:19:45
|
AssertionError: No councillors found
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_qc_trois_rivieres/people.py", line 16, in scrape
assert len(members), "No councillors found"
AssertionError: No councillors found
|
D>
|
ca_qc_westmount
|
2023-03-01 04:14:28
|
2024-04-23 04:16:18
|
Exception: No email node in b'<div class="vc_row wpb_row vc_row-fluid"><div class="wpb_column vc_column_container vc_col-sm-…
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_qc_westmount/people.py", line 29, in scrape
p.add_contact("email", self.get_email(councillor))
File "/app/scrapers/utils.py", line 141, in get_email
raise Exception("No email node in {}".format(etree.tostring(node)))
Exception: No email node in b'<div class="vc_row wpb_row vc_row-fluid"><div class="wpb_column vc_column_container vc_col-sm-4"><div class="vc_column-inner"><div class="wpb_wrapper">\n\t<div class="wpb_single_image wpb_content_element vc_align_center">\n\t\t\n\t\t<figure class="wpb_wrapper vc_figure">\n\t\t\t<div class="vc_single_image-wrapper vc_box_border_grey"><img loading="lazy" decoding="async" width="310" height="434" src="https://westmount.org/wp-content/uploads/2015/03/christina_m_smith_reg.jpg" class="vc_single_image-img attachment-full" alt="" title="christina_m_smith_reg" srcset="https://westmount.org/wp-content/uploads/2015/03/christina_m_smith_reg.jpg 310w, https://westmount.org/wp-content/uploads/2015/03/christina_m_smith_reg-214x300.jpg 214w" sizes="(max-width: 310px) 100vw, 310px"/></div>\n\t\t</figure>\n\t</div>\n<div class="vc_btn3-container vc_btn3-inline"><a class="vc_general vc_btn3 vc_btn3-size-md vc_btn3-shape-square vc_btn3-style-modern vc_btn3-color-grey" href="https://westmount.org/wp-content/uploads/2015/03/christina_smith_media.jpg" title="" target="_blank">Photo média</a></div></div></div></div><div class="wpb_column vc_column_container vc_col-sm-8"><div class="vc_column-inner"><div class="wpb_wrapper">\n\t<div class="wpb_text_column wpb_content_element ">\n\t\t<div class="wpb_wrapper">\n\t\t\t<h4>Christina M. Smith</h4>\n<p><strong>Mairesse de la Ville de Westmount</strong><br/>\nLa mairesse Christina M. Smith fût élue conseillère municipal en 2013 et mairesse de la Ville de Westmount en 2017 et en 2021.<br/>\nVice-présidente de la Commission de la sécurité publique de l’Agglomération de Montréal.</p>\n<ul>\n<li>Téléphone : <a href="https://westmount.org/conseil-municipal/callto:15149895240">514 989-5240</a></li>\n<li>Télécopieur<a name="patrick-martin"/> : 514 989-5481</li>\n</ul>\n\n\t\t</div>\n\t</div>\n<div class="vc_empty_space" style="height: 20px"><span class="vc_empty_space_inner"/></div><div class="vc_tta-container" data-vc-action="collapseAll"><div class="vc_general vc_tta vc_tta-accordion vc_tta-color-white vc_tta-style-flat vc_tta-shape-square vc_tta-o-shape-group vc_tta-controls-align-left vc_tta-o-all-clickable"><div class="vc_tta-panels-container"><div class="vc_tta-panels"><div class="vc_tta-panel" id="1493140680948-48126fe2-9e0e" data-vc-content=".vc_tta-panel-body"><div class="vc_tta-panel-heading"><h4 class="vc_tta-panel-title vc_tta-controls-icon-position-right"><a href="https://westmount.org/conseil-municipal/#1493140680948-48126fe2-9e0e" data-vc-accordion="" data-vc-container=".vc_tta-container"><span class="vc_tta-title-text">Biographie</span><i class="vc_tta-controls-icon vc_tta-controls-icon-plus"/></a></h4></div><div class="vc_tta-panel-body">\n\t<div class="wpb_text_column wpb_content_element ">\n\t\t<div class="wpb_wrapper">\n\t\t\t<p>Christina M. Smith a été élue au conseil municipal de Westmount le 3 novembre 2013 en tant que conseillère du district 5. Durant ce mandat, elle a été également commissaire à l’administration. En avril 2017, Christina Smith a été nommée mairesse intérimaire de Westmount par le Conseil lorsque le maire Peter Trent a pris sa retraite. Le 5 novembre 2017, Christina Smith a été élue mairesse de la Ville.  Durant son mandat de 2017 à 2021, elle a été membre de la Commission des finances de l’Agglomération de Montréal, de la Commission du développement économique et du Comité d’audit. En novembre 2021, Madame Smith a été réélue mairesse de Westmount pour un second mandat. Elle est également vice-présidente de la Commission de la sécurité publique auprès de l’Agglomération de Montréal. La mairesse Smith est également membre de l’exécutif de l’Association des municipalités de banlieue.</p>\n<p>Avant d’entrer dans la politique municipale, Christina était directrice de l’industrie et des affaires gouvernementales pour Coca-Cola. Elle a également été conseillère politique auprès du ministre fédéral des Affaires intergouvernementales. Impliquée dans de nombreuses organisations communautaires, elle croit à l’engagement civique afin que tous les résidents bénéficient de nombreux programmes et services.</p>\n<p>Christina est titulaire d’un baccalauréat en sciences politiques de l’Université Bishop’s. Elle et son mari ont trois jeunes enfants qui apprécient bon nombre des programmes et activités sportives de Westmount.</p>\n\n\t\t</div>\n\t</div>\n</div></div></div></div></div></div></div></div></div></div>'
|
D>
|
ca_sk
|
2024-04-23 04:26:54
|
2024-04-23 08:36:28
|
SystemExit: 1
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_sk/people.py", line 18, in scrape
page = self.lxmlize(url)
File "/app/scrapers/utils.py", line 192, in lxmlize
response = self.get(url, cookies=cookies)
File "/app/scrapers/utils.py", line 184, in get
return super().get(*args, verify=SSL_VERIFY, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/requests/sessions.py", line 602, in get
return self.request("GET", url, **kwargs)
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 579, in request
resp = super().request(
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 404, in request
resp = super().request(
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 231, in request
self._throttle()
File "/app/.heroku/python/lib/python3.8/site-packages/scrapelib/__init__.py", line 188, in _throttle
time.sleep(diff)
File "/app/.heroku/python/lib/python3.8/site-packages/gunicorn/workers/base.py", line 196, in handle_abort
sys.exit(1)
SystemExit: 1
|
D>
04:25:51 WARNING pupa: could not save RunPlan, no successful runs of ocd-jurisdiction/country:ca/csd:4706027/legislature yet
|
ca_sk_regina
|
|
2024-04-23 04:25:51
|
IndexError: list index out of range
Traceback (most recent call last):
File "/app/reports/utils.py", line 71, in scrape_people
report.report = subcommand.handle(args, other)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 260, in handle
return self.do_handle(args, other, juris)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 305, in do_handle
report['scrape'] = self.do_scrape(juris, args, scrapers)
File "/app/.heroku/src/pupa/pupa/cli/commands/update.py", line 173, in do_scrape
report[scraper_name] = scraper.do_scrape(**scrape_args)
File "/app/.heroku/src/pupa/pupa/scrape/base.py", line 99, in do_scrape
for obj in self.scrape(**kwargs) or []:
File "/app/scrapers/ca_sk_regina/people.py", line 25, in scrape
yield self.mayor_data(mayor_url)
File "/app/scrapers/ca_sk_regina/people.py", line 61, in mayor_data
phone_path = page.xpath('//div[@class="councillor__contact"]//ul/li/a/@href[contains(., "306")]')[0]
IndexError: list index out of range
|
C
|
ca_sk_saskatoon
|
2024-04-23 04:44:49
|
2024-04-23 04:44:49
|
|