Refactor image downloading logic and add progress bar (python)

- Replaces the per-image print messages with a progress bar, built with the `tqdm` library, that tracks the image downloads.
- Errors that occur during downloads are collected and reported together after all downloads have completed, instead of being printed as they happen.
This commit is contained in:
Harshit Shukla 2024-09-25 20:37:20 +05:30
parent 82e50c64f0
commit b109c1c6ae

View file

@ -4,24 +4,28 @@ import os
import time import time
import aiohttp import aiohttp
import asyncio import asyncio
from tqdm import tqdm
from urllib.parse import urlparse from urllib.parse import urlparse
url = 'https://storage.googleapis.com/panels-api/data/20240916/media-1a-i-p~s' url = 'https://storage.googleapis.com/panels-api/data/20240916/media-1a-i-p~s'
async def delay(ms):
    """Suspend the calling coroutine for ``ms`` milliseconds.

    Args:
        ms: Pause length in milliseconds.
    """
    # asyncio.sleep() takes seconds, so convert from milliseconds.
    await asyncio.sleep(ms / 1000)
async def download_image(session, image_url, file_path, error_log):
    """Download one image and write its bytes to ``file_path``.

    Failures never propagate to the caller. Each one is appended to
    ``error_log`` as a message so that all errors can be reported together
    once every download has been attempted.

    Args:
        session: Object whose ``get(url)`` returns an async context manager
            yielding a response with a ``status`` attribute and an awaitable
            ``read()``.
        image_url: URL of the image to fetch.
        file_path: Destination path; the file is opened in binary write mode.
        error_log: List that receives one message per failed download.

    Returns:
        True if the image was written, False if a failure was logged.
    """
    try:
        async with session.get(image_url) as response:
            if response.status != 200:
                raise Exception(f"Error code: {response.status}")
            # Read the whole body before opening the file, so a failed
            # transfer does not leave an empty or partial file behind.
            content = await response.read()
            with open(file_path, 'wb') as f:
                f.write(content)
    except Exception as e:
        # Some exceptions (e.g. asyncio.TimeoutError) have an empty str();
        # fall back to the class name so the log entry still has a reason.
        reason = str(e) or type(e).__name__
        error_log.append(f"Error downloading image {image_url}[{reason}]")
        return False
    return True
async def main(): async def main():
error_log = []
try: try:
async with aiohttp.ClientSession() as session: async with aiohttp.ClientSession() as session:
async with session.get(url) as response: async with session.get(url) as response:
@ -39,24 +43,35 @@ async def main():
print(f"📁 Created directory: {download_dir}") print(f"📁 Created directory: {download_dir}")
file_index = 1 file_index = 1
total_images = len([key for key, subproperty in data.items() if subproperty.get('dhd')])
# initialize progress bar with the total number of images
with tqdm(total=total_images, desc="Downloading", unit="image", colour="red") as pbar:
for key, subproperty in data.items(): for key, subproperty in data.items():
if subproperty and subproperty.get('dhd'): if subproperty and subproperty.get('dhd'):
image_url = subproperty['dhd'] image_url = subproperty['dhd']
print(f"🔍 Found image URL!")
parsed_url = urlparse(image_url) parsed_url = urlparse(image_url)
ext = os.path.splitext(parsed_url.path)[-1] or '.jpg' ext = os.path.splitext(parsed_url.path)[-1] or '.jpg'
filename = f"{file_index}{ext}" filename = f"{file_index}{ext}"
file_path = os.path.join(download_dir, filename) file_path = os.path.join(download_dir, filename)
await download_image(session, image_url, file_path, error_log)
await download_image(session, image_url, file_path) pbar.update(1)
print(f"🖼️ Saved image to {file_path}")
file_index += 1 file_index += 1
await delay(250) await delay(250)
except Exception as e: except Exception as e:
print(f"Error: {str(e)}") print(f"Error: {str(e)}")
# After all downloads, report any errors that occurred
if error_log:
print("\n⚠️ The following errors occurred during downloads:")
for error in error_log:
print(error)
else:
print("\n✅ All images downloaded successfully!")
def ascii_art(): def ascii_art():
print(""" print("""
/$$ /$$ /$$ /$$ /$$$$$$$ /$$$$$$ /$$$$$$$ /$$ /$$ /$$ /$$ /$$$$$$$ /$$$$$$ /$$$$$$$