#!/usr/bin/env python3
"""Mirror the Monero infodump page into a local ``infodump/`` directory.

The page is fetched with ``requests``, every ``<img>`` it references is
downloaded with ``wget`` next to the saved page, image ``src`` attributes are
rewritten to point at the local copies, ``https://i.imgur.com`` link targets
are rewritten to bare file names, and the resulting document is written to
``infodump/index.html``.
"""
import os
import posixpath
import subprocess
import sys
from typing import Optional
from urllib.parse import urljoin, urlsplit

import bs4
import requests

PAGE_URL = 'https://moneroinfodump.neocities.org/'
OUT_DIR = 'infodump'
REQUEST_TIMEOUT = 15


def local_name(src: str) -> Optional[str]:
    """Return the path (relative to ``OUT_DIR``) under which *src* is stored.

    Absolute ``http(s)`` URLs are flattened to the last component of their
    URL path; anything else keeps its (normalised) relative path. Query
    strings and fragments are dropped so they do not end up in file names.
    Returns ``None`` when no usable name can be derived or when the path
    would point outside the mirror directory.
    """
    try:
        path = urlsplit(src).path
    except ValueError:
        # Malformed URL scraped from the page: nothing sensible to store.
        return None

    if src.startswith(('http://', 'https://')):
        rel = posixpath.basename(path)
    else:
        # Strip leading slashes so a root-relative path stays inside OUT_DIR.
        rel = posixpath.normpath(path.lstrip('/'))

    if rel in ('', '.', '..') or rel.startswith('../'):
        return None
    return rel


def fetch(remote: str, dest: str) -> bool:
    """Download *remote* to *dest* with ``wget``; return True if *dest* exists.

    An already existing file is left untouched (the effect the original
    ``--no-clobber`` flag was used for). The URL is passed as a separate
    argument, never through a shell, because it comes from scraped HTML.
    """
    if os.path.exists(dest):
        return True

    os.makedirs(os.path.dirname(dest), exist_ok=True)
    result = subprocess.run(
        ['wget', '-q', '-O', dest, '--', remote],
        check=False,
    )
    if result.returncode != 0:
        # `wget -O` creates the output file even when the download fails;
        # remove the leftover so a later run retries instead of skipping it.
        try:
            os.remove(dest)
        except FileNotFoundError:
            pass
        print(f'warning: could not download {remote}', file=sys.stderr)
        return False
    return True


def main() -> None:
    """Fetch the page, localise its images and links, and save the result."""
    os.makedirs(os.path.join(OUT_DIR, 'thumbs'), exist_ok=True)

    response = requests.get(PAGE_URL, timeout=REQUEST_TIMEOUT)
    response.raise_for_status()
    soup = bs4.BeautifulSoup(response.content, 'html.parser')

    for image in soup.find_all('img'):
        src = (image.get('src') or '').strip()
        # Inline data URIs are already self-contained; a missing src has
        # nothing to download.
        if not src or src.startswith('data:'):
            continue

        rel = local_name(src)
        if rel is None:
            continue

        # Resolve relative references against the page URL so wget receives
        # a complete address.
        fetch(urljoin(PAGE_URL, src), os.path.join(OUT_DIR, *rel.split('/')))
        # As before, the src is rewritten whether or not the download
        # succeeded, so the saved page only references local files.
        image['src'] = rel

    # NOTE(review): imgur link targets are only rewritten, not downloaded
    # here; they resolve locally only if the same file was also fetched as an
    # <img> source or is supplied some other way - confirm this is intended.
    for link in soup.find_all('a'):
        href = link.get('href')
        if href and href.startswith('https://i.imgur.com'):
            name = local_name(href)
            if name:
                link['href'] = name

    with open(os.path.join(OUT_DIR, 'index.html'), 'w', encoding='utf-8') as f:
        f.write(str(soup))


if __name__ == '__main__':
    main()