mirror of
https://github.com/kuhyx/testsAndMisc-archive.git
synced 2026-07-04 16:43:08 +02:00
- Convert f-string logging to % style (G004) - Convert open() to Path.open() (PTH123) - Remove G004 and PTH123 from global ignores in pyproject.toml
56 lines
1.4 KiB
Python
56 lines
1.4 KiB
Python
"""Download cat images from TheCatAPI.
|
|
|
|
Fetches cat images in batches and saves them to a local directory.
|
|
"""
|
|
|
|
import json
|
|
import logging
|
|
from pathlib import Path
|
|
|
|
import requests
|
|
|
|
_logger = logging.getLogger(__name__)
|
|
|
|
MAX_REQUESTS = 90
|
|
REQUEST_TIMEOUT = 30 # seconds
|
|
|
|
|
|
def _download_single_image(url: str) -> None:
|
|
"""Download and save a single image from URL.
|
|
|
|
Args:
|
|
url: The URL of the image to download.
|
|
"""
|
|
try:
|
|
# Get the image content
|
|
response = requests.get(url, timeout=REQUEST_TIMEOUT)
|
|
response.raise_for_status() # Raise an exception for HTTP errors
|
|
|
|
# Extract the image name from the URL
|
|
image_name = Path(url).name
|
|
image_path = Path("./CATS2/") / image_name
|
|
|
|
# Save the image to the directory
|
|
with image_path.open("wb") as file:
|
|
file.write(response.content)
|
|
|
|
_logger.info("Saved %s as %s", url, image_path)
|
|
|
|
except requests.exceptions.RequestException:
|
|
_logger.exception("Failed to download %s", url)
|
|
|
|
|
|
requests_send = 0
|
|
while requests_send < MAX_REQUESTS:
|
|
res = requests.get(
|
|
"https://api.thecatapi.com/v1/images/search?limit=100&api_key=",
|
|
timeout=REQUEST_TIMEOUT,
|
|
)
|
|
requests_send += 1
|
|
response = json.loads(res.text)
|
|
urls = [cat.get("url") for cat in response]
|
|
|
|
Path("./CATS2").mkdir(parents=True, exist_ok=True)
|
|
for url in urls:
|
|
_download_single_image(url)
|