from dataclasses import dataclass
from io import StringIO
from lxml import html, etree
from github import Github
import multiprocessing
import pihole as ph
import qbittorrent
import configparser
import requests
import datetime
import urllib.parse
import urllib.request
import docker
import random
import queue
import json
import time
import os

theLastId = 0

CONFIG = configparser.ConfigParser(interpolation=None)
CONFIG.read("edaweb.conf")


def humanbytes(B):
    'Return the given bytes as a human friendly KB, MB, GB, or TB string'
    B = float(B)
    KB = float(1024)
    MB = float(KB ** 2)  # 1,048,576
    GB = float(KB ** 3)  # 1,073,741,824
    TB = float(KB ** 4)  # 1,099,511,627,776

    if B < KB:
        return '{0} {1}'.format(B, 'Byte' if B == 1 else 'Bytes')
    elif KB <= B < MB:
        return '{0:.2f} KB'.format(B / KB)
    elif MB <= B < GB:
        return '{0:.2f} MB'.format(B / MB)
    elif GB <= B < TB:
        return '{0:.2f} GB'.format(B / GB)
    elif TB <= B:
        return '{0:.2f} TB'.format(B / TB)


@dataclass
class SafebooruImage:
    id_: int
    url: str
    searchTags: list
    tags: list
    source: str
    imurl: str

    def remove_tag(self, tag):
        # Return the search tags with the given tag removed.
        return list(set(self.searchTags).difference(set([tag])))


@dataclass
class DownloadedImage:
    imurl: str

    def __enter__(self):
        # Download the image to a fixed path under static/images/ and return it;
        # the file is deleted again when the context manager exits.
        self.filename = os.path.join("static", "images", "random.jpg")
        req = urllib.request.Request(
            self.imurl,
            headers={
                'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_5_8) AppleWebKit/534.50.2 (KHTML, like Gecko) Version/5.0.6 Safari/533.22.3'
            }
        )
        mediaContent = urllib.request.urlopen(req).read()
        with open(self.filename, "wb") as f:
            f.write(mediaContent)
        return self.filename

    def __exit__(self, type, value, traceback):
        os.remove(self.filename)


def get_num_pages(tags):
    # Safebooru lists 5 * 8 = 40 thumbnails per page; the pid parameter of the
    # final pagination link is converted into a page count.
    pages_url = "https://safebooru.org/index.php?page=post&s=list&tags=%s" % "+".join(tags)
    tree = html.fromstring(requests.get(pages_url).content)
    try:
        finalpage_element = tree.xpath("/html/body/div[6]/div/div[2]/div[2]/div/a[12]")[0]
    except IndexError:
        return 1
    else:
        return int(int(urllib.parse.parse_qs(finalpage_element.get("href"))["pid"][0]) / (5 * 8))


def get_id_from_url(url):
    # parse_qs is applied to the whole URL; it still yields the "id" query parameter.
    return int(urllib.parse.parse_qs(url)["id"][0])


def get_random_image(tags):
    global theLastId
    # Pick a random listing page and convert it to a pid offset (40 posts per page).
    searchPage = random.randint(1, get_num_pages(tags)) * 5 * 8
    url = "https://safebooru.org/index.php?page=post&s=list&tags=%s&pid=%i" % ("+".join(tags), searchPage)
    tree = html.fromstring(requests.get(url).content)
    imageElements = [e for e in tree.xpath("/html/body/div[6]/div/div[2]/div[1]")[0].iter(tag="a")]
    try:
        element = random.choice(imageElements)
    except IndexError:
        # raise ConnectionError("Couldn't find any images")
        return get_random_image(tags)

    url = "https://safebooru.org/" + element.get("href")
    # Avoid returning the same image twice in a row.
    if get_id_from_url(url) == theLastId:
        return get_random_image(tags)
    theLastId = get_id_from_url(url)

    try:
        sbi = SafebooruImage(
            id_=get_id_from_url(url),
            url=url,
            tags=element.find("img").get("alt").split(),
            searchTags=tags,
            source=fix_source_url(get_source(url)),
            imurl=get_imurl(url)
        )
    except (ConnectionError, KeyError) as e:
        print("[ERROR]", e)
        return get_random_image(tags)

    if link_deleted(sbi.url):
        print("Retried since the source was deleted...")
        return get_random_image(tags)

    return sbi


def get_source(url):
    # Look through the post's stats sidebar for the "Source:" entry, which is
    # either plain text or a link to the original artwork.
    tree = html.fromstring(requests.get(url).content)
    for element in tree.xpath('//*[@id="stats"]')[0].iter("li"):
        if element.text is None:
            continue
        if element.text.startswith("Source: h"):
            return element.text[8:]
        elif element.text.startswith("Source:"):
            for child in element.iter():
                if child.get("href") is not None:
                    return child.get("href")
    raise ConnectionError("Couldn't find source image for id %i" % get_id_from_url(url))
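# Illustrative sketch (not part of the original module): how the helpers above
# chain together. The tag list is an assumption for demonstration, the function
# is only defined (never called on import), and it needs safebooru.org to be
# reachable.
def _demo_random_image(tags=("scenery",)):
    sbi = get_random_image(list(tags))            # pick a random matching post
    print(sbi.id_, sbi.source)                    # post id and upstream artwork URL
    with DownloadedImage(sbi.imurl) as path:      # download to static/images/random.jpg
        print(path, humanbytes(os.path.getsize(path)))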
def fix_source_url(url):
    # Normalise source URLs: rewrite pixiv/pximg links to canonical pixiv
    # artwork pages and twitter links to the nitter mirror.
    parsed = urllib.parse.urlparse(url)
    if parsed.netloc == "www.pixiv.net":
        return "https://www.pixiv.net/en/artworks/" + urllib.parse.parse_qs(parsed.query)["illust_id"][0]
    elif parsed.netloc in ["bishie.booru.org", "www.secchan.net"]:
        raise ConnectionError("Couldn't get source")
    elif "pximg.net" in parsed.netloc or "pixiv.net" in parsed.netloc:
        return "https://www.pixiv.net/en/artworks/" + parsed.path.split("/")[-1][:8]
    elif parsed.netloc == "twitter.com":
        return url.replace("twitter.com", "nitter.eda.gay")
    return url


def get_imurl(url):
    tree = html.fromstring(requests.get(url).content)
    return tree.xpath('//*[@id="image"]')[0].get("src")


def link_deleted(url):
    text = requests.get(url).text
    return text[text.find("