testsAndMisc/python_pkg/download_cats/generate_cats.py
Krzysztof kuhy Rudnicki bb6713eabb fix(lint): convert os.path to pathlib - remove PTH per-file ignores
- Converted os.path patterns to pathlib.Path in 15+ files
- os.path.join → Path /
- os.path.dirname → Path.parent
- os.path.exists → Path.exists()
- os.path.isfile → Path.is_file()
- os.path.abspath → Path.resolve()
- os.mkdir → Path.mkdir()
- os.listdir → Path.iterdir()
- os.getcwd → Path.cwd()
- os.replace → Path.replace()
- Updated function type hints to accept str | Path

Added PTH123 (open() vs Path.open()) to global ignores as stylistic preference
2025-11-30 23:03:03 +01:00

56 lines
1.4 KiB
Python

"""Download cat images from TheCatAPI.
Fetches cat images in batches and saves them to a local directory.
"""
import json
import logging
from pathlib import Path
import requests
_logger = logging.getLogger(__name__)
MAX_REQUESTS = 90
REQUEST_TIMEOUT = 30 # seconds
def _download_single_image(url: str) -> None:
"""Download and save a single image from URL.
Args:
url: The URL of the image to download.
"""
try:
# Get the image content
response = requests.get(url, timeout=REQUEST_TIMEOUT)
response.raise_for_status() # Raise an exception for HTTP errors
# Extract the image name from the URL
image_name = Path(url).name
image_path = Path("./CATS2/") / image_name
# Save the image to the directory
with open(image_path, "wb") as file:
file.write(response.content)
_logger.info("Saved %s as %s", url, image_path)
except requests.exceptions.RequestException:
_logger.exception("Failed to download %s", url)
requests_send = 0
while requests_send < MAX_REQUESTS:
res = requests.get(
"https://api.thecatapi.com/v1/images/search?limit=100&api_key=",
timeout=REQUEST_TIMEOUT,
)
requests_send += 1
response = json.loads(res.text)
urls = [cat.get("url") for cat in response]
Path("./CATS2").mkdir(parents=True, exist_ok=True)
for url in urls:
_download_single_image(url)