{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "import polars as pl\n", "from pathlib import Path\n", "import logging\n", "from utils import set_up_logging, delete_corrupt_images\n", "\n", "# Pass the relative ../logs path to the logging helper imported from utils.\n", "set_up_logging(Path(\"../logs\"))\n", "\n", "# Run-wide settings. Nothing in the cells visible here reads the first three;\n", "# presumably later cells do (TODO confirm).\n", "RETRY_COUNT = 10\n", "WORKER_COUNT = 16\n", "HTTP_TIMEOUT = 120  # presumably seconds -- TODO confirm\n", "\n", "# Resolve the download target to an absolute path up front and stop with an\n", "# AssertionError if it does not exist.\n", "TARGET_PATH = Path(\"/mnt/wsl/PHYSICALDRIVE0p1/downloaded-unsplash\").resolve()\n", "assert TARGET_PATH.exists()" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [], "source": [ "# Collect every direct entry of TARGET_PATH (non-recursive glob) into a list\n", "# and hand it to delete_corrupt_images from utils.\n", "delete_corrupt_images([*TARGET_PATH.glob(\"*\")])" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
| photo_id | photo_image_url |
|---|---|
| str | str |
| "---jvVJZ34o" | "https://images.unsplash.com/ph… |
| "--0-I4GpLZU" | "https://images.unsplash.com/ph… |
| "--2IBUMom1I" | "https://images.unsplash.com/ph… |
| "--2sDoKRgCg" | "https://images.unsplash.com/ph… |
| "--5QEAiAfgE" | "https://images.unsplash.com/ph… |
| "--6JlGcHl-w" | "https://images.unsplash.com/ph… |
| "--6sqOMUDs8" | "https://images.unsplash.com/ph… |
| "--97ozlPF1A" | "https://images.unsplash.com/ph… |
| "--D4Gg8RhIk" | "https://images.unsplash.com/ph… |
| "--EUYLhCTdc" | "https://images.unsplash.com/ph… |