Tidy code automatically

This commit is contained in:
benoit74 2023-11-23 08:50:59 +01:00
parent 216ac09d8c
commit 79d5f8bc7b
No known key found for this signature in database
GPG Key ID: B89606434FC7B530

View File

@ -30,6 +30,7 @@ from zimscraperlib.uri import rebuild_uri
DEFAULT_USER_AGENT = "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/17.0 Safari/605.1.15" DEFAULT_USER_AGENT = "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/17.0 Safari/605.1.15"
class ProgressFileWatcher: class ProgressFileWatcher:
def __init__(self, output_dir, stats_path): def __init__(self, output_dir, stats_path):
self.crawl_path = output_dir / "crawl.json" self.crawl_path = output_dir / "crawl.json"
@ -153,9 +154,7 @@ def zimit(args=None):
type=int, type=int,
) )
parser.add_argument( parser.add_argument("--limit", help="Limit crawl to this number of pages", type=int)
"--limit", help="Limit crawl to this number of pages", type=int
)
parser.add_argument( parser.add_argument(
"--maxPageLimit", "--maxPageLimit",
@ -226,7 +225,7 @@ def zimit(args=None):
parser.add_argument( parser.add_argument(
"--userAgent", "--userAgent",
help="Override default user-agent with specified value ; --userAgentSuffix is still applied", help="Override default user-agent with specified value ; --userAgentSuffix is still applied",
default=DEFAULT_USER_AGENT default=DEFAULT_USER_AGENT,
) )
parser.add_argument( parser.add_argument(
@ -447,7 +446,11 @@ def check_url(url, user_agent, scope=None):
url = urllib.parse.urlparse(url) url = urllib.parse.urlparse(url)
try: try:
with requests.get( with requests.get(
url.geturl(), stream=True, allow_redirects=True, timeout=(12.2, 27), headers={"User-Agent": user_agent} url.geturl(),
stream=True,
allow_redirects=True,
timeout=(12.2, 27),
headers={"User-Agent": user_agent},
) as resp: ) as resp:
resp.raise_for_status() resp.raise_for_status()
except requests.exceptions.RequestException as exc: except requests.exceptions.RequestException as exc: