diff options
author | Dave Cottlehuber <dch@FreeBSD.org> | 2025-05-21 14:46:29 +0000 |
---|---|---|
committer | Dave Cottlehuber <dch@FreeBSD.org> | 2025-05-21 14:48:37 +0000 |
commit | e70ba49f6c0acfac90e0b822a6a0d908700d06c3 (patch) | |
tree | 1e6966bab814e4be90b9d68d87c114042f1fec2e /misc/py-aider-chat/files/patch-aider_scrape.py | |
parent | databases/couchdb3: update to 3.5.0 (diff) |
misc/py-aider-chat: update to 0.82.2
- ChangeLog https://aider.chat/HISTORY.html#aider-v0822
Diffstat (limited to 'misc/py-aider-chat/files/patch-aider_scrape.py')
-rw-r--r-- | misc/py-aider-chat/files/patch-aider_scrape.py | 16 |
1 files changed, 9 insertions, 7 deletions
diff --git a/misc/py-aider-chat/files/patch-aider_scrape.py b/misc/py-aider-chat/files/patch-aider_scrape.py index 969ff29d15f8..e52881317294 100644 --- a/misc/py-aider-chat/files/patch-aider_scrape.py +++ b/misc/py-aider-chat/files/patch-aider_scrape.py @@ -1,4 +1,4 @@ ---- aider/scrape.py.orig 2024-09-09 10:28:04 UTC +--- aider/scrape.py.orig 2025-04-14 23:24:32 UTC +++ aider/scrape.py @@ -15,57 +15,8 @@ def install_playwright(io): @@ -80,10 +80,12 @@ if not content: self.print_error(f"Failed to retrieve content from {url}") -@@ -130,56 +78,6 @@ class Scraper: +@@ -128,58 +76,6 @@ class Scraper: + ] + return any(re.search(pattern, content, re.IGNORECASE) for pattern in html_patterns) return False - - # Internals... +- +- # Internals... - def scrape_with_playwright(self, url): - import playwright # noqa: F401 - from playwright.sync_api import Error as PlaywrightError @@ -113,7 +115,8 @@ - try: - response = page.goto(url, wait_until="networkidle", timeout=5000) - except PlaywrightTimeoutError: -- self.print_error(f"Timeout while loading {url}") +- print(f"Page didn't quiesce, scraping content anyway: {url}") +- response = None - except PlaywrightError as e: - self.print_error(f"Error navigating to {url}: {str(e)}") - return None, None @@ -133,7 +136,6 @@ - browser.close() - - return content, mime_type -- + def scrape_with_httpx(self, url): import httpx - |