From 425b13d7a4df033d00469c77fd21b91cc955bf45 Mon Sep 17 00:00:00 2001 From: Nick Hahn Date: Thu, 15 Sep 2022 18:34:42 +0200 Subject: [PATCH] Preserve old runs in pads.json --- hedgedoc-image.py | 19 ++++++++++++++++--- 1 file changed, 16 insertions(+), 3 deletions(-) diff --git a/hedgedoc-image.py b/hedgedoc-image.py index 184b275..dcb5d90 100644 --- a/hedgedoc-image.py +++ b/hedgedoc-image.py @@ -7,6 +7,7 @@ import os from urllib.parse import urlparse from typing import List +from os.path import exists PATH = "images/" NEW_NETLOC = "" @@ -17,8 +18,8 @@ pads_json = [] os.makedirs(PATH, exist_ok=True) os.makedirs(PATH + "uploads", exist_ok=True) -# TODO: Loop detection -# TODO: Recursion + + class Image: def __init__(self, _old_url: str) -> None: self.old_url = _old_url @@ -26,7 +27,6 @@ class Image: self.new_url = "." + old.path; def download(self): - print("HERE") r = requests.get(self.old_url) p = PATH + urlparse(self.old_url).path with open(p, 'wb') as f: @@ -116,6 +116,19 @@ if __name__ == "__main__": args = parser.parse_args() + old_file = [] + + if exists("pads.json"): + with open("pads.json", "r") as f: + old_file = json.load(f) + + for entry in old_file: + seen_pads.append(entry["old_url"]) + + pads_json.extend(old_file) + print(f"Seen Pads: {seen_pads}") + + NEW_NETLOC = args.new_pad_url[0] pad = PadPage(args.pad_url[0]) pad.download_and_process_content()