#!/usr/bin/env python3

import os
import subprocess
from urllib.parse import urljoin, urlsplit

import bs4
import requests

# Mirror the Monero infodump page for offline viewing: fetch the page, download
# the images it references into OUTPUT_DIR, rewrite the references to point at
# the local copies, and save the rewritten page as OUTPUT_DIR/index.html.

OUTPUT_DIR = 'infodump'
url = 'https://moneroinfodump.neocities.org/'


def _local_path(reference):
    """Return the path, relative to OUTPUT_DIR, under which *reference* is stored.

    References that name a host are flattened to their file name; site-relative
    references keep their directory layout. Query strings and fragments are
    dropped so the name on disk matches what a browser looks up locally.
    """
    parts = urlsplit(reference)
    if parts.netloc:
        return os.path.basename(parts.path)
    # A leading '/' would resolve against the filesystem root once the page is
    # opened from disk, so store (and later reference) it relative to the page.
    return parts.path.lstrip('/')


def _mirror(remote, relative_path):
    """Download *remote* to OUTPUT_DIR/relative_path and report whether it exists.

    Returns True when a non-empty local file is present afterwards (freshly
    downloaded or kept from an earlier run), False otherwise.
    """
    dest = os.path.normpath(os.path.join(OUTPUT_DIR, relative_path))
    # The path comes from a remote page: refuse empty names and anything that
    # would land outside the output directory (e.g. '../../x').
    if not dest.startswith(OUTPUT_DIR + os.sep):
        return False
    os.makedirs(os.path.dirname(dest), exist_ok=True)
    # Argument list instead of a shell string, so characters in the scraped
    # URL can never be interpreted by a shell.
    subprocess.run(
        ['wget', '-q', '--no-clobber', '-O', dest, remote],
        check=False,
    )
    # wget -O can leave a zero-byte file behind when the fetch fails; remove it
    # so --no-clobber does not treat it as already downloaded on the next run.
    if os.path.isfile(dest) and os.path.getsize(dest) == 0:
        os.remove(dest)
    return os.path.isfile(dest)


os.makedirs(os.path.join(OUTPUT_DIR, 'thumbs'), exist_ok=True)

response = requests.get(url, timeout=15)
# Fail loudly rather than mirroring an HTTP error page as index.html.
response.raise_for_status()
contents = response.content
soup = bs4.BeautifulSoup(contents, 'html.parser')
images = soup.find_all('img')
links = soup.find_all('a')

for image in images:
    img = image.get('src')
    # Nothing to fetch for <img> tags without a src or with inline data URIs.
    if not img or img.startswith('data:'):
        continue
    local = _local_path(img)
    # Relative references must be resolved against the page URL before wget
    # can fetch them. Keep the original src when the download did not succeed.
    if _mirror(urljoin(url, img), local):
        image['src'] = local

for link in links:
    href = link.get('href')
    if href and href.startswith('https://i.imgur.com'):
        local = _local_path(href)
        # Fetch the link target too; otherwise the rewritten href would point
        # at a file that only exists if the same URL was also an <img> src.
        if _mirror(href, local):
            link['href'] = local

with open(os.path.join(OUTPUT_DIR, 'index.html'), 'w', encoding='utf-8') as f:
    f.write(str(soup))