Don't require networkidle: if the page reaches 'load' but never becomes network-idle, continue anyway
This commit is contained in:
parent
2fa3f71631
commit
3c6cb2c42c
1 changed file with 13 additions and 4 deletions
|
|
@@ -11,7 +11,10 @@ from dataclasses import dataclass
|
||||||
from pathlib import Path
|
from pathlib import Path
|
||||||
from urllib.parse import urljoin, urldefrag, urlparse
|
from urllib.parse import urljoin, urldefrag, urlparse
|
||||||
|
|
||||||
from playwright.async_api import async_playwright
|
from playwright.async_api import (
|
||||||
|
async_playwright,
|
||||||
|
TimeoutError as PlaywrightTimeoutError,
|
||||||
|
)
|
||||||
|
|
||||||
from .ensure_playwright import ensure_chromium_installed
|
from .ensure_playwright import ensure_chromium_installed
|
||||||
|
|
||||||
|
|
@@ -528,8 +531,14 @@ async def crawl_and_generate_csp(
|
||||||
page.on("response", on_response)
|
page.on("response", on_response)
|
||||||
|
|
||||||
try:
|
try:
|
||||||
resp = await page.goto(
|
resp = await page.goto(url, wait_until="load", timeout=timeout_ms)
|
||||||
url, wait_until="networkidle", timeout=timeout_ms
|
try:
|
||||||
|
await page.wait_for_load_state(
|
||||||
|
"networkidle", timeout=min(5000, timeout_ms)
|
||||||
|
)
|
||||||
|
except PlaywrightTimeoutError:
|
||||||
|
notes.append(
|
||||||
|
f"Timed out waiting for networkidle on {url}; continuing after load anyway."
|
||||||
)
|
)
|
||||||
|
|
||||||
ct = ""
|
ct = ""
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue