From d0b42a1a46670072585299d5f50e204b20d73525 Mon Sep 17 00:00:00 2001 From: Alexei Date: Mon, 6 Jan 2025 13:05:16 -0500 Subject: [PATCH] Don't get current_url on unrecoverable exceptions Following up on 5211f67 --- crawler.py | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/crawler.py b/crawler.py index 92d5986..a89efc4 100755 --- a/crawler.py +++ b/crawler.py @@ -1052,9 +1052,7 @@ def crawl(self): num_visited += 1 except (MaxRetryError, ProtocolError, ReadTimeoutError) as ex: - self.logger.warning("Error loading %s:\n%s", - self.get_current_url() or domain, - str(ex)) + self.logger.warning("Error loading %s:\n%s", domain, str(ex)) self.restart_browser() except TimeoutException: