comparison kemonopartydownloader.py @ 100:b14e2a096ebf
kemonopartydownloader.py: add --timeout, fix output
also drive detection wasn't working LOL
| author | Paper <37962225+mrpapersonic@users.noreply.github.com> |
|---|---|
| committer | GitHub <noreply@github.com> |
| date | Sun, 14 Aug 2022 06:20:12 -0400 |
| parents | 2bccbf473ff4 |
| children | f10492e8720b |
comparison
| 99:2bccbf473ff4 | 100:b14e2a096ebf |
|---|---|
| 1 """ | 1 """ |
| 2 Usage: | 2 Usage: |
| 3 kemonopartydownloader.py <url>... (--cookies <filename>) | 3 kemonopartydownloader.py <url>... (--cookies <filename>) |
| 4 [--output <folder>] | 4 [--output <folder>] |
| 5 [--proxy <proxy>] | 5 [--proxy <proxy>] |
| | 6 [--timeout <seconds>] |
| 6 kemonopartydownloader.py -h \| --help | 7 kemonopartydownloader.py -h \| --help |
| 7 | 8 |
| 8 Arguments: | 9 Arguments: |
| 9 <url> Kemono.party URL to download from | 10 <url> Kemono.party URL to download from |
| 10 -c --cookies <filename> A Netscape-compatible cookies.txt file | 11 -c --cookies <filename> A Netscape-compatible cookies.txt file |
| 11 | 12 |
| 12 Options: | 13 Options: |
| 13 -h --help Show this screen | 14 -h --help Show this screen |
| 14 -o --output <folder> Output folder, relative to the current directory | 15 -o --output <folder> Output folder, relative to the current directory |
| | 16 [default: .] |
| 15 -p --proxy <proxy> HTTP or HTTPS proxy (SOCKS5 with PySocks) | 17 -p --proxy <proxy> HTTP or HTTPS proxy (SOCKS5 with PySocks) |
| | 18 -t --timeout <seconds> Time between downloads [default: 1] |
| 16 """ | 19 """ |
| 17 import docopt | 20 import docopt |
| 18 import http.cookiejar | 21 import http.cookiejar |
| 19 import os | 22 import os |
| 20 import re | 23 import re |
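The new usage text gives both --output and --timeout docopt defaults, so the later lookups always get a value. A standalone sketch of how docopt resolves those defaults; the trimmed usage string, the example.py name, and the URL are illustrative, not the script's full interface:

```python
import docopt

USAGE = """
Usage:
  example.py <url>... [--output <folder>] [--timeout <seconds>]

Options:
  -o --output <folder>    Output folder, relative to the current directory [default: .]
  -t --timeout <seconds>  Time between downloads [default: 1]
"""

# No flags passed: docopt falls back to the [default: ...] annotations.
args = docopt.docopt(USAGE, argv=["https://kemono.party/gumroad/user/12345"])
print(args["--output"])   # "."
print(args["--timeout"])  # "1" -- a string, hence the int() cast added later in the script
```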
| 79 sanitize(i["title"]))) | 82 sanitize(i["title"]))) |
| 80 os.remove(succeededjson["archives"][0]["fileName"]) | 83 os.remove(succeededjson["archives"][0]["fileName"]) |
| 81 return 0 | 84 return 0 |
| 82 | 85 |
| 83 | 86 |
| 84 def unzip(src_path: str, dst_dir: str, pwd=None) -> None: | 87 def unzip(src_path: str, dst_dir: str, pwd: str = None) -> None: |
| 85 with zipfile.ZipFile(src_path) as zf: | 88 with zipfile.ZipFile(src_path) as zf: |
| 86 members = zf.namelist() | 89 members = zf.namelist() |
| 87 for member in members: | 90 for member in members: |
| 88 arch_info = zf.getinfo(member) | 91 arch_info = zf.getinfo(member) |
| 89 arch_name = arch_info.filename.replace('/', os.path.sep) | 92 arch_name = arch_info.filename.replace('/', os.path.sep) |
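Worth noting on the new `pwd: str = None` annotation: the standard-library zipfile password APIs take bytes, so a str password would need to be encoded before use. A minimal standalone sketch; the archive name, output folder, and password are placeholders, not values from the script:

```python
import zipfile

with zipfile.ZipFile("archive.zip") as zf:
    zf.setpassword("hunter2".encode("utf-8"))   # zipfile expects bytes, not str
    for member in zf.namelist():
        zf.extract(member, path="out")          # extract()/extractall() also accept pwd= per call
```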
| 208 | 211 |
| 209 def download_file(i: dict, x: dict, count: int) -> None: | 212 def download_file(i: dict, x: dict, count: int) -> None: |
| 210 filename = "%s/%s_%dp_%s_%s" % (output, i["id"], count, | 213 filename = "%s/%s_%dp_%s_%s" % (output, i["id"], count, |
| 211 sanitize(i["title"]), x["name"]) | 214 sanitize(i["title"]), x["name"]) |
| 212 amountdone = 0 | 215 amountdone = 0 |
| 213 filesize = os.stat(filename).st_size if os.path.exists(filename) else 0 | 216 filesize = 0 |
| | 217 if os.path.exists(filename): |
| | 218 filesize = os.path.getsize(filename) |
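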
| 214 serverhead = req.head("https://kemono.party/data" + x['path'], | 219 serverhead = req.head("https://kemono.party/data" + x['path'], |
| 215 allow_redirects=True) | 220 allow_redirects=True) |
| 216 for i in range(500): | 221 for i in range(500): |
| 217 serverfilesize = int(serverhead.headers["Content-Length"]) | 222 serverfilesize = int(serverhead.headers["Content-Length"]) |
| 218 if filesize < serverfilesize: | 223 if filesize < serverfilesize: |
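The rewritten size check feeds the resume logic: the local file size is compared against the server's Content-Length from the HEAD request so an interrupted download can be picked up instead of restarted. The general shape of that resume idiom with requests looks roughly like this; it is a generic sketch, not the script's exact download loop, and the URL argument is a placeholder:

```python
import os
import requests

def resume_download(url: str, filename: str) -> None:
    # How much is already on disk, if anything.
    done = os.path.getsize(filename) if os.path.exists(filename) else 0
    total = int(requests.head(url, allow_redirects=True).headers["Content-Length"])
    if done >= total:
        return  # already complete
    # Ask only for the missing tail and append it to the partial file.
    with requests.get(url, headers={"Range": "bytes=%d-" % done}, stream=True) as r:
        r.raise_for_status()
        with open(filename, "ab") as f:
            for chunk in r.iter_content(chunk_size=65536):
                f.write(chunk)
```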
| 240 def parse_json(i: dict, count: int) -> None: | 245 def parse_json(i: dict, count: int) -> None: |
| 241 unique_urls = [] | 246 unique_urls = [] |
| 242 for url in find_urls(i["content"]): | 247 for url in find_urls(i["content"]): |
| 243 parsed_url = urllib.parse.urlparse(url) | 248 parsed_url = urllib.parse.urlparse(url) |
| 244 if parsed_url.netloc == "drive.google.com": | 249 if parsed_url.netloc == "drive.google.com": |
| 245 if parsed_url.path.startswith("drive/folders"): | 250 if parsed_url.path.startswith("/drive/folders"): |
| 246 if url not in unique_urls: | 251 if url not in unique_urls: |
| 247 download_folder_from_google_drive(url) | 252 download_folder_from_google_drive(url) |
| 248 unique_urls.append(url) | 253 unique_urls.append(url) |
| 249 elif (parsed_url.path == "open" and | 254 elif (parsed_url.path == "/open" and |
| 250 parsed_url.query.startswith == "id"): | 255 parsed_url.query.startswith == "id"): |
| 251 if url not in unique_urls: | 256 if url not in unique_urls: |
| 252 download_file_from_google_drive( | 257 download_file_from_google_drive( |
| 253 parsed_url.query.split("=") | 258 parsed_url.query.split("=") |
| 254 [-1]) | 259 [-1]) |
| 255 unique_urls.append(url) | 260 unique_urls.append(url) |
| 256 elif parsed_url.path.startswith("file/"): | 261 elif parsed_url.path.startswith("/file/"): |
| 257 if url not in unique_urls: | 262 if url not in unique_urls: |
| 258 download_file_from_google_drive(parsed_url.path.split("/") | 263 download_file_from_google_drive(parsed_url.path.split("/") |
| 259 [-2]) | 264 [-2]) |
| 260 unique_urls.append(url) | 265 unique_urls.append(url) |
| 261 elif parsed_url.netloc in ["dropbox.com", "www.dropbox.com"]: | 266 elif parsed_url.netloc in ["dropbox.com", "www.dropbox.com"]: |
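The drive-detection fix comes down to the leading slash: urllib.parse.urlparse keeps it in .path, so the old startswith("drive/folders"), == "open", and startswith("file/") tests could never match. A quick standalone check; the folder id is made up:

```python
import urllib.parse

parsed = urllib.parse.urlparse("https://drive.google.com/drive/folders/abc123")
print(parsed.path)                               # "/drive/folders/abc123" -- leading slash included
print(parsed.path.startswith("drive/folders"))   # False: why Drive links were silently skipped before
print(parsed.path.startswith("/drive/folders"))  # True: the corrected check
```

(The `parsed_url.query.startswith == "id"` condition on the /open branch is unchanged in this commit; as written it compares the bound method object to a string, so that branch still never matches.)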
| 267 while not os.path.exists("%s/%s_%dp_%s_%s" | 272 while not os.path.exists("%s/%s_%dp_%s_%s" |
| 268 % (output, i["id"], count, | 273 % (output, i["id"], count, |
| 269 sanitize(i["title"]), x["name"])): | 274 sanitize(i["title"]), x["name"])): |
| 270 try: | 275 try: |
| 271 download_file(i, x, count) | 276 download_file(i, x, count) |
| 272 break | |
| 273 except (HTTPError, BadStatusLine): | 277 except (HTTPError, BadStatusLine): |
| 274 while 1: | 278 while 1: |
| 275 time.sleep(10) | 279 time.sleep(10) |
| 276 download_file(i, x, count) | 280 download_file(i, x, count) |
| 277 except Exception as e: | 281 except Exception as e: |
| 278 print(e) | 282 print(e) |
| 279 time.sleep(10) | 283 time.sleep(timeout) |
| 280 | 284 |
| 281 | 285 |
| 282 def get_amount_of_posts(s: str, u: str): | 286 def get_amount_of_posts(s: str, u: str): |
| 283 amount = 0 | 287 amount = 0 |
| 284 while 1: | 288 while 1: |
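Two things change in the retry loop above: the explicit break after download_file is dropped, so the loop re-checks that the file actually landed on disk before moving on, and the catch-all handler now sleeps for the configurable --timeout value instead of a hard-coded 10 seconds. Condensed into a generic sketch with hypothetical names (the separate HTTPError/BadStatusLine branch is left out):

```python
import os
import time

def fetch_until_present(path: str, fetch, delay: float = 1.0) -> None:
    """Call `fetch` until `path` exists, pausing `delay` seconds after generic failures."""
    while not os.path.exists(path):
        try:
            fetch()                # any callable that writes `path` on success
        except Exception as exc:   # mirrors the script's broad catch
            print(exc)
            time.sleep(delay)      # --timeout replaces the old fixed 10 s here
```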
| 296 if args["--proxy"]: | 300 if args["--proxy"]: |
| 297 req.proxies = { | 301 req.proxies = { |
| 298 "http": args["--proxy"], | 302 "http": args["--proxy"], |
| 299 "https": args["--proxy"], | 303 "https": args["--proxy"], |
| 300 } | 304 } |
| | 305 |
| | 306 timeout = int(args["--timeout"]) |
| 301 | 307 |
| 302 cj = http.cookiejar.MozillaCookieJar(args["--cookies"]) | 308 cj = http.cookiejar.MozillaCookieJar(args["--cookies"]) |
| 303 cj.load(ignore_expires=True) | 309 cj.load(ignore_expires=True) |
| 304 req.cookies = cj | 310 req.cookies = cj |
| 305 | 311 |
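`req` is used like a requests.Session throughout (req.proxies, req.cookies, req.head, req.get); assuming that, the new option handling maps onto a session roughly as below. The values in the args dict are placeholders standing in for what docopt would return:

```python
import http.cookiejar
import requests

# Stand-in for the docopt result; every value here is a placeholder.
args = {"--proxy": "socks5h://127.0.0.1:1080",
        "--cookies": "cookies.txt",
        "--timeout": "1"}

req = requests.Session()
if args["--proxy"]:
    # The same proxy URL serves both schemes; socks5 URLs need PySocks installed.
    req.proxies = {"http": args["--proxy"], "https": args["--proxy"]}

# Netscape-format cookies.txt, loaded even if its entries have expired.
cj = http.cookiejar.MozillaCookieJar(args["--cookies"])
cj.load(ignore_expires=True)
req.cookies = cj  # requests accepts any cookielib-compatible jar

timeout = int(args["--timeout"])  # docopt hands back strings, hence the cast
```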
| 316 elif url.split("/")[-2] == "user": | 322 elif url.split("/")[-2] == "user": |
| 317 service = url.split("/")[-3] | 323 service = url.split("/")[-3] |
| 318 user = url.split("/")[-1] | 324 user = url.split("/")[-1] |
| 319 pages = get_amount_of_posts(service, user) | 325 pages = get_amount_of_posts(service, user) |
| 320 | 326 |
| 321 output = "" | 327 output = "%s/%s-%s" % (args["--output"], service, user) |
| 322 if args["--output"]: | 328 |
| 323 output = args.output + "/" | 329 if not os.path.exists(output): |
| 324 output += "%s-%s" % (service, user) | 330 os.mkdir(output) |
| 325 | 331 |
| 326 for page in range(pages): | 332 for page in range(pages): |
| 327 try: | 333 try: |
| 328 post | 334 post |
| 329 userdata = req.get("https://kemono.party/api/%s/user/%s/post/%s" | 335 userdata = req.get("https://kemono.party/api/%s/user/%s/post/%s" |
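One caveat with the new output handling: os.mkdir only creates the last path component, so pointing --output at a folder that does not exist yet still raises FileNotFoundError, and an already-existing service-user folder is only tolerated because of the explicit exists check. os.makedirs with exist_ok covers both cases in one call; the service and user values below are made up:

```python
import os

output = "%s/%s-%s" % (".", "gumroad", "12345")  # --output default, service, user (placeholders)
os.makedirs(output, exist_ok=True)               # also creates missing parents, safe to re-run
```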
