explosm.net download script

📅 2021-02-14T12:35:07.000Z
👁️ 218 katselukertaa
🔓 Julkinen


import requests
from bs4 import BeautifulSoup
import os

# Directory the comic images are saved into; created below if it is missing.
dl_dir = './images/'

# Highest comic number to request (inclusive).
nmbr_of_pages = 5785

# Seconds to wait on each HTTP request, so a stalled connection cannot hang
# the whole run.
request_timeout = 30

# Without this, every open() below fails when the directory does not exist and
# each comic would be reported as skipped.
os.makedirs(dl_dir, exist_ok=True)

# Request the comic pages by number, starting at 15, and save the image that
# each page advertises in its <meta property="og:image"> tag into dl_dir.
# A comic that cannot be fetched, parsed or written is skipped (best effort).
for i in range(15, nmbr_of_pages+1):
    idx = str(i)
    try:
        r = requests.get("https://explosm.net/comics/" + idx + "/",
                         timeout=request_timeout)
        if r.status_code != 200:
            print("Skipping image", idx)
            continue

        print("Downloading image", idx)
        soup = BeautifulSoup(r.content, features="html.parser")
        img_url = soup.head.find("meta", {"property": "og:image"})["content"]
        print(img_url)

        img_r = requests.get(img_url, timeout=request_timeout)
        # Do not store an HTTP error body under an image file name.
        img_r.raise_for_status()
        with open(os.path.join(dl_dir, os.path.basename(img_url)), 'wb') as f:
            f.write(img_r.content)
    except Exception as exc:
        # Per-comic boundary: keep going on network, parsing and file errors,
        # but (unlike a bare ``except:``) let KeyboardInterrupt and SystemExit
        # propagate so the run can still be stopped with Ctrl-C.
        print("Skipping image", idx, repr(exc))