mirror of
https://github.com/kuhyx/testsAndMisc.git
synced 2026-07-04 16:23:04 +02:00
- Converted os.path patterns to pathlib.Path in 15+ files - os.path.join → Path / - os.path.dirname → Path.parent - os.path.exists → Path.exists() - os.path.isfile → Path.is_file() - os.path.abspath → Path.resolve() - os.mkdir → Path.mkdir() - os.listdir → Path.iterdir() - os.getcwd → Path.cwd() - os.replace → Path.replace() - Updated function type hints to accept str | Path Added PTH123 (open() vs Path.open()) to global ignores as stylistic preference
56 lines
1.4 KiB
Python
56 lines
1.4 KiB
Python
"""Download cat images from TheCatAPI.
|
|
|
|
Fetches cat images in batches and saves them to a local directory.
|
|
"""
|
|
|
|
import json
|
|
import logging
|
|
from pathlib import Path
|
|
|
|
import requests
|
|
|
|
_logger = logging.getLogger(__name__)
|
|
|
|
MAX_REQUESTS = 90
|
|
REQUEST_TIMEOUT = 30 # seconds
|
|
|
|
|
|
def _download_single_image(url: str) -> None:
|
|
"""Download and save a single image from URL.
|
|
|
|
Args:
|
|
url: The URL of the image to download.
|
|
"""
|
|
try:
|
|
# Get the image content
|
|
response = requests.get(url, timeout=REQUEST_TIMEOUT)
|
|
response.raise_for_status() # Raise an exception for HTTP errors
|
|
|
|
# Extract the image name from the URL
|
|
image_name = Path(url).name
|
|
image_path = Path("./CATS2/") / image_name
|
|
|
|
# Save the image to the directory
|
|
with open(image_path, "wb") as file:
|
|
file.write(response.content)
|
|
|
|
_logger.info("Saved %s as %s", url, image_path)
|
|
|
|
except requests.exceptions.RequestException:
|
|
_logger.exception("Failed to download %s", url)
|
|
|
|
|
|
requests_send = 0
|
|
while requests_send < MAX_REQUESTS:
|
|
res = requests.get(
|
|
"https://api.thecatapi.com/v1/images/search?limit=100&api_key=",
|
|
timeout=REQUEST_TIMEOUT,
|
|
)
|
|
requests_send += 1
|
|
response = json.loads(res.text)
|
|
urls = [cat.get("url") for cat in response]
|
|
|
|
Path("./CATS2").mkdir(parents=True, exist_ok=True)
|
|
for url in urls:
|
|
_download_single_image(url)
|